diff --git "a/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" "b/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" --- "a/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" +++ "b/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 6.4242, "train/learning_rate": 2.7059111851779235e-05, "train/epoch": 0.42, "train/global_step": 1500, "_runtime": 6296, "_timestamp": 1646220575, "_step": 1502, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 30431.0, 32.0, 12.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2968.0, -2902.34375, -2836.6875, -2771.03125, -2705.375, -2639.71875, -2574.0625, -2508.40625, -2442.75, -2377.09375, -2311.4375, -2245.78125, -2180.125, -2114.46875, -2048.8125, -1983.15625, -1917.5, -1851.84375, -1786.1875, -1720.53125, -1654.875, -1589.21875, -1523.5625, -1457.90625, -1392.25, -1326.59375, -1260.9375, -1195.28125, -1129.625, -1063.96875, -998.3125, -932.65625, -867.0, -801.34375, -735.6875, -670.03125, -604.375, -538.71875, -473.0625, -407.40625, -341.75, -276.09375, -210.4375, -144.78125, -79.125, -13.46875, 52.1875, 117.84375, 183.5, 249.15625, 314.8125, 380.46875, 446.125, 511.78125, 577.4375, 643.09375, 708.75, 774.40625, 840.0625, 905.71875, 971.375, 1037.03125, 1102.6875, 1168.34375, 1234.0]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 0.0, 4.0, 5.0, 6.0, 4.0, 9.0, 13.0, 20.0, 29.0, 33.0, 56.0, 59.0, 72.0, 98.0, 112.0, 86.0, 103.0, 77.0, 60.0, 46.0, 32.0, 21.0, 19.0, 10.0, 5.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-539.41552734375, -519.9755249023438, -500.5354919433594, -481.095458984375, -461.65545654296875, -442.2154235839844, -422.775390625, -403.33538818359375, -383.8953552246094, -364.455322265625, -345.01531982421875, -325.5752868652344, -306.13525390625, -286.69525146484375, -267.2552185058594, -247.81520080566406, -228.37518310546875, -208.93516540527344, -189.49514770507812, -170.05511474609375, -150.61509704589844, -131.17507934570312, -111.73505401611328, -92.29502868652344, -72.85501098632812, -53.41498947143555, -33.97496795654297, -14.53494644165039, 4.9050750732421875, 24.3450927734375, 43.785118103027344, 63.22514343261719, 82.66510009765625, 102.10511779785156, 121.5451431274414, 140.98516845703125, 160.42518615722656, 179.86520385742188, 199.30523681640625, 218.74525451660156, 238.18527221679688, 257.62530517578125, 277.0653076171875, 296.5053405761719, 315.94537353515625, 335.3853759765625, 354.8254089355469, 374.26544189453125, 393.7054443359375, 413.1454772949219, 432.5854797363281, 452.0255126953125, 471.46551513671875, 490.9055480957031, 510.3455810546875, 529.7855834960938, 549.2255859375, 568.6655883789062, 588.1056518554688, 607.545654296875, 626.9856567382812, 646.4256591796875, 665.86572265625, 685.3057250976562, 704.7457885742188]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 10.0, 11.0, 5.0, 12.0, 16.0, 18.0, 29.0, 24.0, 29.0, 26.0, 31.0, 46.0, 37.0, 41.0, 36.0, 39.0, 44.0, 57.0, 44.0, 50.0, 56.0, 54.0, 42.0, 20.0, 36.0, 25.0, 28.0, 24.0, 22.0, 19.0, 12.0, 8.0, 12.0, 13.0, 8.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-378.13671875, -364.7825927734375, -351.4284973144531, -338.07440185546875, -324.72027587890625, -311.36614990234375, -298.0120544433594, -284.657958984375, -271.3038330078125, -257.94970703125, -244.59561157226562, -231.2415008544922, -217.88739013671875, -204.5332794189453, -191.17916870117188, -177.82505798339844, -164.470947265625, -151.11683654785156, -137.76272583007812, -124.40861511230469, -111.05450439453125, -97.70039367675781, -84.34628295898438, -70.99217224121094, -57.6380615234375, -44.28395080566406, -30.929840087890625, -17.575729370117188, -4.22161865234375, 9.132492065429688, 22.486602783203125, 35.84071350097656, 49.19482421875, 62.54893493652344, 75.90304565429688, 89.25715637207031, 102.61126708984375, 115.96537780761719, 129.31948852539062, 142.67359924316406, 156.0277099609375, 169.38182067871094, 182.73593139648438, 196.0900421142578, 209.44415283203125, 222.7982635498047, 236.15237426757812, 249.50648498535156, 262.860595703125, 276.2147216796875, 289.5688171386719, 302.92291259765625, 316.27703857421875, 329.63116455078125, 342.9852600097656, 356.33935546875, 369.6934814453125, 383.047607421875, 396.4017028808594, 409.75579833984375, 423.10992431640625, 436.46405029296875, 449.8181457519531, 463.1722412109375, 476.5263671875]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 9.0, 15.0, 19.0, 27.0, 40.0, 76.0, 102.0, 134.0, 194.0, 384.0, 546.0, 993.0, 1601.0, 2791.0, 5208.0, 10066.0, 21752.0, 50413.0, 160923.0, 618910.0, 101845.0, 37706.0, 16472.0, 8140.0, 4253.0, 2360.0, 1379.0, 818.0, 495.0, 309.0, 195.0, 127.0, 79.0, 51.0, 38.0, 26.0, 15.0, 9.0, 11.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1651.0, -1596.578125, -1542.15625, -1487.734375, -1433.3125, -1378.890625, -1324.46875, -1270.046875, -1215.625, -1161.203125, -1106.78125, -1052.359375, -997.9375, -943.515625, -889.09375, -834.671875, -780.25, -725.828125, -671.40625, -616.984375, -562.5625, -508.140625, -453.71875, -399.296875, -344.875, -290.453125, -236.03125, -181.609375, -127.1875, -72.765625, -18.34375, 36.078125, 90.5, 144.921875, 199.34375, 253.765625, 308.1875, 362.609375, 417.03125, 471.453125, 525.875, 580.296875, 634.71875, 689.140625, 743.5625, 797.984375, 852.40625, 906.828125, 961.25, 1015.671875, 1070.09375, 1124.515625, 1178.9375, 1233.359375, 1287.78125, 1342.203125, 1396.625, 1451.046875, 1505.46875, 1559.890625, 1614.3125, 1668.734375, 1723.15625, 1777.578125, 1832.0]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 7.0, 14.0, 13.0, 13.0, 21.0, 27.0, 18.0, 35.0, 50.0, 99.0, 171.0, 196.0, 81.0, 39.0, 34.0, 34.0, 32.0, 19.0, 17.0, 15.0, 6.0, 7.0, 11.0, 2.0, 4.0, 7.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-343.25, -329.53515625, -315.8203125, -302.10546875, -288.390625, -274.67578125, -260.9609375, -247.24609375, -233.53125, -219.81640625, -206.1015625, -192.38671875, -178.671875, -164.95703125, -151.2421875, -137.52734375, -123.8125, -110.09765625, -96.3828125, -82.66796875, -68.953125, -55.23828125, -41.5234375, -27.80859375, -14.09375, -0.37890625, 13.3359375, 27.05078125, 40.765625, 54.48046875, 68.1953125, 81.91015625, 95.625, 109.33984375, 123.0546875, 136.76953125, 150.484375, 164.19921875, 177.9140625, 191.62890625, 205.34375, 219.05859375, 232.7734375, 246.48828125, 260.203125, 273.91796875, 287.6328125, 301.34765625, 315.0625, 328.77734375, 342.4921875, 356.20703125, 369.921875, 383.63671875, 397.3515625, 411.06640625, 424.78125, 438.49609375, 452.2109375, 465.92578125, 479.640625, 493.35546875, 507.0703125, 520.78515625, 534.5]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 8.0, 15.0, 19.0, 16.0, 37.0, 39.0, 48.0, 53.0, 65.0, 99.0, 114.0, 107.0, 78.0, 75.0, 46.0, 38.0, 31.0, 28.0, 11.0, 10.0, 17.0, 9.0, 8.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-287.3674621582031, -279.0684814453125, -270.76947021484375, -262.4704895019531, -254.1715087890625, -245.8725128173828, -237.57351684570312, -229.2745361328125, -220.9755401611328, -212.67654418945312, -204.3775634765625, -196.0785675048828, -187.77957153320312, -179.4805908203125, -171.1815948486328, -162.88259887695312, -154.5836181640625, -146.2846221923828, -137.9856414794922, -129.6866455078125, -121.38765716552734, -113.08866882324219, -104.7896728515625, -96.49068450927734, -88.19169616699219, -79.89270782470703, -71.59371948242188, -63.29472351074219, -54.99573516845703, -46.696746826171875, -38.39775466918945, -30.09876251220703, -21.7998046875, -13.500814437866211, -5.201824188232422, 3.097166061401367, 11.396156311035156, 19.695144653320312, 27.994136810302734, 36.293128967285156, 44.59211730957031, 52.89110565185547, 61.19009780883789, 69.48908996582031, 77.78807830810547, 86.08706665039062, 94.38606262207031, 102.68505096435547, 110.98403930664062, 119.28302764892578, 127.58201599121094, 135.88101196289062, 144.17999267578125, 152.47898864746094, 160.77798461914062, 169.07696533203125, 177.37596130371094, 185.67495727539062, 193.97393798828125, 202.27293395996094, 210.57192993164062, 218.87091064453125, 227.16990661621094, 235.46890258789062, 243.76788330078125]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 10.0, 3.0, 11.0, 9.0, 9.0, 11.0, 15.0, 19.0, 23.0, 22.0, 17.0, 34.0, 41.0, 40.0, 45.0, 35.0, 46.0, 27.0, 47.0, 44.0, 31.0, 38.0, 43.0, 37.0, 41.0, 34.0, 38.0, 37.0, 17.0, 17.0, 22.0, 22.0, 14.0, 14.0, 20.0, 18.0, 15.0, 8.0, 4.0, 2.0, 7.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-157.59765625, -152.5367431640625, -147.475830078125, -142.41493225097656, -137.35401916503906, -132.29310607910156, -127.2322006225586, -122.17129516601562, -117.11038208007812, -112.04946899414062, -106.98856353759766, -101.92765808105469, -96.86674499511719, -91.80583190917969, -86.74492645263672, -81.68402099609375, -76.62310791015625, -71.56219482421875, -66.50128936767578, -61.44038009643555, -56.37947082519531, -51.31856155395508, -46.257652282714844, -41.19674301147461, -36.135833740234375, -31.07492446899414, -26.014015197753906, -20.953105926513672, -15.892196655273438, -10.831287384033203, -5.770378112792969, -0.7094688415527344, 4.3514404296875, 9.412349700927734, 14.473258972167969, 19.534168243408203, 24.595077514648438, 29.655986785888672, 34.716896057128906, 39.77780532836914, 44.838714599609375, 49.89962387084961, 54.960533142089844, 60.02144241333008, 65.08235168457031, 70.14326477050781, 75.20417022705078, 80.26507568359375, 85.32598876953125, 90.38690185546875, 95.44780731201172, 100.50871276855469, 105.56962585449219, 110.63053894042969, 115.69144439697266, 120.75234985351562, 125.81326293945312, 130.87417602539062, 135.93508911132812, 140.99598693847656, 146.05690002441406, 151.11781311035156, 156.1787109375, 161.2396240234375, 166.300537109375]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 4.0, 16.0, 22.0, 36.0, 42.0, 61.0, 105.0, 150.0, 192.0, 305.0, 447.0, 677.0, 1047.0, 1508.0, 2238.0, 3383.0, 5195.0, 7884.0, 12635.0, 20328.0, 34347.0, 60817.0, 121803.0, 423393.0, 1853023.0, 1208628.0, 224570.0, 89168.0, 47373.0, 27448.0, 16411.0, 10457.0, 6790.0, 4454.0, 2990.0, 2012.0, 1386.0, 883.0, 619.0, 417.0, 304.0, 233.0, 141.0, 107.0, 73.0, 48.0, 30.0, 25.0, 22.0, 8.0, 8.0, 1.0, 8.0, 2.0, 1.0, 2.0, 1.0], "bins": [-203.625, -197.22265625, -190.8203125, -184.41796875, -178.015625, -171.61328125, -165.2109375, -158.80859375, -152.40625, -146.00390625, -139.6015625, -133.19921875, -126.796875, -120.39453125, -113.9921875, -107.58984375, -101.1875, -94.78515625, -88.3828125, -81.98046875, -75.578125, -69.17578125, -62.7734375, -56.37109375, -49.96875, -43.56640625, -37.1640625, -30.76171875, -24.359375, -17.95703125, -11.5546875, -5.15234375, 1.25, 7.65234375, 14.0546875, 20.45703125, 26.859375, 33.26171875, 39.6640625, 46.06640625, 52.46875, 58.87109375, 65.2734375, 71.67578125, 78.078125, 84.48046875, 90.8828125, 97.28515625, 103.6875, 110.08984375, 116.4921875, 122.89453125, 129.296875, 135.69921875, 142.1015625, 148.50390625, 154.90625, 161.30859375, 167.7109375, 174.11328125, 180.515625, 186.91796875, 193.3203125, 199.72265625, 206.125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 6.0, 10.0, 11.0, 11.0, 17.0, 10.0, 12.0, 25.0, 16.0, 14.0, 31.0, 17.0, 31.0, 41.0, 35.0, 33.0, 52.0, 32.0, 42.0, 46.0, 37.0, 42.0, 47.0, 37.0, 33.0, 30.0, 26.0, 35.0, 35.0, 16.0, 22.0, 20.0, 15.0, 22.0, 8.0, 15.0, 20.0, 8.0, 6.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-79.0, -76.5439453125, -74.087890625, -71.6318359375, -69.17578125, -66.7197265625, -64.263671875, -61.8076171875, -59.3515625, -56.8955078125, -54.439453125, -51.9833984375, -49.52734375, -47.0712890625, -44.615234375, -42.1591796875, -39.703125, -37.2470703125, -34.791015625, -32.3349609375, -29.87890625, -27.4228515625, -24.966796875, -22.5107421875, -20.0546875, -17.5986328125, -15.142578125, -12.6865234375, -10.23046875, -7.7744140625, -5.318359375, -2.8623046875, -0.40625, 2.0498046875, 4.505859375, 6.9619140625, 9.41796875, 11.8740234375, 14.330078125, 16.7861328125, 19.2421875, 21.6982421875, 24.154296875, 26.6103515625, 29.06640625, 31.5224609375, 33.978515625, 36.4345703125, 38.890625, 41.3466796875, 43.802734375, 46.2587890625, 48.71484375, 51.1708984375, 53.626953125, 56.0830078125, 58.5390625, 60.9951171875, 63.451171875, 65.9072265625, 68.36328125, 70.8193359375, 73.275390625, 75.7314453125, 78.1875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 14.0, 23.0, 32.0, 44.0, 68.0, 93.0, 158.0, 233.0, 352.0, 528.0, 739.0, 1225.0, 2040.0, 3252.0, 5606.0, 9392.0, 16739.0, 31301.0, 62263.0, 133289.0, 325304.0, 1279877.0, 1652997.0, 373842.0, 148220.0, 68332.0, 34135.0, 18227.0, 10467.0, 5984.0, 3531.0, 2140.0, 1333.0, 861.0, 566.0, 342.0, 243.0, 153.0, 101.0, 80.0, 47.0, 29.0, 26.0, 12.0, 10.0, 12.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-172.75, -167.189453125, -161.62890625, -156.068359375, -150.5078125, -144.947265625, -139.38671875, -133.826171875, -128.265625, -122.705078125, -117.14453125, -111.583984375, -106.0234375, -100.462890625, -94.90234375, -89.341796875, -83.78125, -78.220703125, -72.66015625, -67.099609375, -61.5390625, -55.978515625, -50.41796875, -44.857421875, -39.296875, -33.736328125, -28.17578125, -22.615234375, -17.0546875, -11.494140625, -5.93359375, -0.373046875, 5.1875, 10.748046875, 16.30859375, 21.869140625, 27.4296875, 32.990234375, 38.55078125, 44.111328125, 49.671875, 55.232421875, 60.79296875, 66.353515625, 71.9140625, 77.474609375, 83.03515625, 88.595703125, 94.15625, 99.716796875, 105.27734375, 110.837890625, 116.3984375, 121.958984375, 127.51953125, 133.080078125, 138.640625, 144.201171875, 149.76171875, 155.322265625, 160.8828125, 166.443359375, 172.00390625, 177.564453125, 183.125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 8.0, 5.0, 6.0, 9.0, 7.0, 9.0, 20.0, 23.0, 27.0, 26.0, 46.0, 53.0, 63.0, 73.0, 99.0, 118.0, 176.0, 215.0, 278.0, 496.0, 686.0, 432.0, 275.0, 194.0, 170.0, 103.0, 106.0, 71.0, 56.0, 40.0, 38.0, 39.0, 24.0, 14.0, 12.0, 14.0, 14.0, 8.0, 4.0, 6.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.46875, -48.861328125, -47.25390625, -45.646484375, -44.0390625, -42.431640625, -40.82421875, -39.216796875, -37.609375, -36.001953125, -34.39453125, -32.787109375, -31.1796875, -29.572265625, -27.96484375, -26.357421875, -24.75, -23.142578125, -21.53515625, -19.927734375, -18.3203125, -16.712890625, -15.10546875, -13.498046875, -11.890625, -10.283203125, -8.67578125, -7.068359375, -5.4609375, -3.853515625, -2.24609375, -0.638671875, 0.96875, 2.576171875, 4.18359375, 5.791015625, 7.3984375, 9.005859375, 10.61328125, 12.220703125, 13.828125, 15.435546875, 17.04296875, 18.650390625, 20.2578125, 21.865234375, 23.47265625, 25.080078125, 26.6875, 28.294921875, 29.90234375, 31.509765625, 33.1171875, 34.724609375, 36.33203125, 37.939453125, 39.546875, 41.154296875, 42.76171875, 44.369140625, 45.9765625, 47.583984375, 49.19140625, 50.798828125, 52.40625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 14.0, 8.0, 10.0, 13.0, 22.0, 26.0, 37.0, 43.0, 61.0, 65.0, 73.0, 66.0, 77.0, 98.0, 68.0, 52.0, 56.0, 47.0, 22.0, 23.0, 22.0, 12.0, 17.0, 8.0, 7.0, 6.0, 2.0, 3.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-119.94526672363281, -116.22440338134766, -112.50354766845703, -108.78268432617188, -105.06182861328125, -101.3409652709961, -97.62010192871094, -93.89924621582031, -90.17839050292969, -86.45752716064453, -82.7366714477539, -79.01580810546875, -75.29495239257812, -71.57408905029297, -67.85322570800781, -64.13236999511719, -60.41150665283203, -56.69064712524414, -52.96978759765625, -49.248924255371094, -45.52806854248047, -41.80720520019531, -38.08634567260742, -34.36548614501953, -30.64462661743164, -26.92376708984375, -23.20290756225586, -19.482046127319336, -15.761186599731445, -12.040327072143555, -8.319465637207031, -4.598606109619141, -0.87774658203125, 2.843113422393799, 6.563973426818848, 10.284833908081055, 14.005693435668945, 17.726552963256836, 21.44741439819336, 25.16827392578125, 28.88913345336914, 32.60999298095703, 36.33085250854492, 40.05171203613281, 43.77257537841797, 47.493431091308594, 51.21429443359375, 54.93515396118164, 58.65601348876953, 62.37687301635742, 66.09773254394531, 69.81859588623047, 73.5394515991211, 77.26031494140625, 80.98117065429688, 84.70203399658203, 88.42289733886719, 92.14376068115234, 95.86461639404297, 99.58547973632812, 103.30633544921875, 107.0271987915039, 110.74806213378906, 114.46891784667969, 118.18977355957031]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 5.0, 12.0, 8.0, 11.0, 17.0, 17.0, 16.0, 25.0, 35.0, 26.0, 35.0, 31.0, 35.0, 45.0, 33.0, 45.0, 38.0, 40.0, 47.0, 39.0, 38.0, 41.0, 46.0, 25.0, 32.0, 40.0, 23.0, 32.0, 18.0, 23.0, 23.0, 9.0, 9.0, 15.0, 9.0, 12.0, 7.0, 6.0, 6.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-84.60026550292969, -81.89408111572266, -79.18790435791016, -76.48171997070312, -73.7755355834961, -71.0693588256836, -68.36317443847656, -65.65699768066406, -62.95081329345703, -60.244632720947266, -57.538448333740234, -54.83226776123047, -52.1260871887207, -49.41990661621094, -46.713722229003906, -44.00754165649414, -41.30135726928711, -38.595176696777344, -35.88899230957031, -33.18281173706055, -30.47663116455078, -27.770448684692383, -25.064266204833984, -22.35808563232422, -19.65190315246582, -16.945720672607422, -14.239540100097656, -11.533357620239258, -8.827176094055176, -6.120994567871094, -3.4148120880126953, -0.7086315155029297, 1.9975509643554688, 4.703732490539551, 7.409914493560791, 10.116096496582031, 12.822278022766113, 15.528459548950195, 18.234642028808594, 20.94082260131836, 23.647005081176758, 26.353187561035156, 29.059368133544922, 31.76555061340332, 34.47173309326172, 37.177913665771484, 39.88409423828125, 42.59027862548828, 45.29645919799805, 48.00263977050781, 50.708824157714844, 53.41500473022461, 56.121185302734375, 58.827369689941406, 61.53355026245117, 64.23973083496094, 66.94591522216797, 69.652099609375, 72.3582763671875, 75.06446075439453, 77.77064514160156, 80.47682189941406, 83.1830062866211, 85.88919067382812, 88.59536743164062]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 8.0, 12.0, 17.0, 27.0, 30.0, 42.0, 62.0, 88.0, 162.0, 244.0, 361.0, 550.0, 778.0, 1183.0, 1817.0, 2905.0, 4526.0, 7353.0, 11191.0, 18114.0, 28972.0, 46528.0, 75303.0, 126659.0, 208552.0, 200165.0, 120684.0, 72744.0, 44176.0, 27758.0, 17265.0, 10960.0, 6982.0, 4341.0, 2764.0, 1753.0, 1177.0, 774.0, 511.0, 334.0, 230.0, 130.0, 115.0, 76.0, 36.0, 26.0, 18.0, 18.0, 10.0, 10.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0], "bins": [-46.40625, -44.998046875, -43.58984375, -42.181640625, -40.7734375, -39.365234375, -37.95703125, -36.548828125, -35.140625, -33.732421875, -32.32421875, -30.916015625, -29.5078125, -28.099609375, -26.69140625, -25.283203125, -23.875, -22.466796875, -21.05859375, -19.650390625, -18.2421875, -16.833984375, -15.42578125, -14.017578125, -12.609375, -11.201171875, -9.79296875, -8.384765625, -6.9765625, -5.568359375, -4.16015625, -2.751953125, -1.34375, 0.064453125, 1.47265625, 2.880859375, 4.2890625, 5.697265625, 7.10546875, 8.513671875, 9.921875, 11.330078125, 12.73828125, 14.146484375, 15.5546875, 16.962890625, 18.37109375, 19.779296875, 21.1875, 22.595703125, 24.00390625, 25.412109375, 26.8203125, 28.228515625, 29.63671875, 31.044921875, 32.453125, 33.861328125, 35.26953125, 36.677734375, 38.0859375, 39.494140625, 40.90234375, 42.310546875, 43.71875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 1.0, 6.0, 6.0, 8.0, 4.0, 12.0, 11.0, 13.0, 21.0, 16.0, 17.0, 28.0, 26.0, 24.0, 34.0, 30.0, 31.0, 39.0, 28.0, 35.0, 34.0, 34.0, 32.0, 41.0, 38.0, 34.0, 26.0, 50.0, 39.0, 28.0, 30.0, 31.0, 16.0, 31.0, 20.0, 17.0, 24.0, 18.0, 9.0, 11.0, 4.0, 9.0, 6.0, 7.0, 6.0, 4.0, 7.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-75.9375, -73.5771484375, -71.216796875, -68.8564453125, -66.49609375, -64.1357421875, -61.775390625, -59.4150390625, -57.0546875, -54.6943359375, -52.333984375, -49.9736328125, -47.61328125, -45.2529296875, -42.892578125, -40.5322265625, -38.171875, -35.8115234375, -33.451171875, -31.0908203125, -28.73046875, -26.3701171875, -24.009765625, -21.6494140625, -19.2890625, -16.9287109375, -14.568359375, -12.2080078125, -9.84765625, -7.4873046875, -5.126953125, -2.7666015625, -0.40625, 1.9541015625, 4.314453125, 6.6748046875, 9.03515625, 11.3955078125, 13.755859375, 16.1162109375, 18.4765625, 20.8369140625, 23.197265625, 25.5576171875, 27.91796875, 30.2783203125, 32.638671875, 34.9990234375, 37.359375, 39.7197265625, 42.080078125, 44.4404296875, 46.80078125, 49.1611328125, 51.521484375, 53.8818359375, 56.2421875, 58.6025390625, 60.962890625, 63.3232421875, 65.68359375, 68.0439453125, 70.404296875, 72.7646484375, 75.125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 12.0, 20.0, 17.0, 44.0, 62.0, 99.0, 124.0, 199.0, 288.0, 487.0, 764.0, 1161.0, 1823.0, 2939.0, 4639.0, 7383.0, 11888.0, 19460.0, 32459.0, 57143.0, 104841.0, 218764.0, 280493.0, 133170.0, 69972.0, 39406.0, 23290.0, 14111.0, 8580.0, 5447.0, 3502.0, 2146.0, 1403.0, 836.0, 555.0, 356.0, 205.0, 137.0, 94.0, 69.0, 47.0, 28.0, 18.0, 19.0, 16.0, 12.0, 3.0, 1.0, 3.0, 6.0, 3.0, 1.0], "bins": [-28.25, -27.42333984375, -26.5966796875, -25.77001953125, -24.943359375, -24.11669921875, -23.2900390625, -22.46337890625, -21.63671875, -20.81005859375, -19.9833984375, -19.15673828125, -18.330078125, -17.50341796875, -16.6767578125, -15.85009765625, -15.0234375, -14.19677734375, -13.3701171875, -12.54345703125, -11.716796875, -10.89013671875, -10.0634765625, -9.23681640625, -8.41015625, -7.58349609375, -6.7568359375, -5.93017578125, -5.103515625, -4.27685546875, -3.4501953125, -2.62353515625, -1.796875, -0.97021484375, -0.1435546875, 0.68310546875, 1.509765625, 2.33642578125, 3.1630859375, 3.98974609375, 4.81640625, 5.64306640625, 6.4697265625, 7.29638671875, 8.123046875, 8.94970703125, 9.7763671875, 10.60302734375, 11.4296875, 12.25634765625, 13.0830078125, 13.90966796875, 14.736328125, 15.56298828125, 16.3896484375, 17.21630859375, 18.04296875, 18.86962890625, 19.6962890625, 20.52294921875, 21.349609375, 22.17626953125, 23.0029296875, 23.82958984375, 24.65625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 5.0, 10.0, 9.0, 15.0, 12.0, 15.0, 17.0, 24.0, 18.0, 28.0, 23.0, 40.0, 36.0, 37.0, 25.0, 44.0, 53.0, 59.0, 42.0, 39.0, 40.0, 50.0, 20.0, 33.0, 43.0, 32.0, 24.0, 27.0, 35.0, 17.0, 13.0, 12.0, 16.0, 19.0, 17.0, 6.0, 12.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.90625, -50.18212890625, -48.4580078125, -46.73388671875, -45.009765625, -43.28564453125, -41.5615234375, -39.83740234375, -38.11328125, -36.38916015625, -34.6650390625, -32.94091796875, -31.216796875, -29.49267578125, -27.7685546875, -26.04443359375, -24.3203125, -22.59619140625, -20.8720703125, -19.14794921875, -17.423828125, -15.69970703125, -13.9755859375, -12.25146484375, -10.52734375, -8.80322265625, -7.0791015625, -5.35498046875, -3.630859375, -1.90673828125, -0.1826171875, 1.54150390625, 3.265625, 4.98974609375, 6.7138671875, 8.43798828125, 10.162109375, 11.88623046875, 13.6103515625, 15.33447265625, 17.05859375, 18.78271484375, 20.5068359375, 22.23095703125, 23.955078125, 25.67919921875, 27.4033203125, 29.12744140625, 30.8515625, 32.57568359375, 34.2998046875, 36.02392578125, 37.748046875, 39.47216796875, 41.1962890625, 42.92041015625, 44.64453125, 46.36865234375, 48.0927734375, 49.81689453125, 51.541015625, 53.26513671875, 54.9892578125, 56.71337890625, 58.4375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 9.0, 5.0, 11.0, 6.0, 10.0, 21.0, 21.0, 37.0, 74.0, 85.0, 116.0, 143.0, 219.0, 313.0, 525.0, 731.0, 1057.0, 1637.0, 2618.0, 4286.0, 7182.0, 12362.0, 23868.0, 50142.0, 132661.0, 522684.0, 167552.0, 58303.0, 27035.0, 14066.0, 7818.0, 4692.0, 2805.0, 1803.0, 1177.0, 756.0, 517.0, 341.0, 257.0, 171.0, 131.0, 72.0, 64.0, 38.0, 30.0, 28.0, 33.0, 17.0, 10.0, 9.0, 3.0, 5.0, 1.0, 2.0], "bins": [-8.9609375, -8.70916748046875, -8.4573974609375, -8.20562744140625, -7.953857421875, -7.70208740234375, -7.4503173828125, -7.19854736328125, -6.94677734375, -6.69500732421875, -6.4432373046875, -6.19146728515625, -5.939697265625, -5.68792724609375, -5.4361572265625, -5.18438720703125, -4.9326171875, -4.68084716796875, -4.4290771484375, -4.17730712890625, -3.925537109375, -3.67376708984375, -3.4219970703125, -3.17022705078125, -2.91845703125, -2.66668701171875, -2.4149169921875, -2.16314697265625, -1.911376953125, -1.65960693359375, -1.4078369140625, -1.15606689453125, -0.904296875, -0.65252685546875, -0.4007568359375, -0.14898681640625, 0.102783203125, 0.35455322265625, 0.6063232421875, 0.85809326171875, 1.10986328125, 1.36163330078125, 1.6134033203125, 1.86517333984375, 2.116943359375, 2.36871337890625, 2.6204833984375, 2.87225341796875, 3.1240234375, 3.37579345703125, 3.6275634765625, 3.87933349609375, 4.131103515625, 4.38287353515625, 4.6346435546875, 4.88641357421875, 5.13818359375, 5.38995361328125, 5.6417236328125, 5.89349365234375, 6.145263671875, 6.39703369140625, 6.6488037109375, 6.90057373046875, 7.15234375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 2.0, 9.0, 8.0, 10.0, 13.0, 16.0, 15.0, 25.0, 34.0, 26.0, 35.0, 53.0, 47.0, 72.0, 80.0, 78.0, 73.0, 72.0, 64.0, 46.0, 34.0, 35.0, 31.0, 18.0, 13.0, 15.0, 7.0, 11.0, 9.0, 9.0, 8.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016412734985351562, -0.001587405800819397, -0.0015335381031036377, -0.0014796704053878784, -0.0014258027076721191, -0.0013719350099563599, -0.0013180673122406006, -0.0012641996145248413, -0.001210331916809082, -0.0011564642190933228, -0.0011025965213775635, -0.0010487288236618042, -0.000994861125946045, -0.0009409934282302856, -0.0008871257305145264, -0.0008332580327987671, -0.0007793903350830078, -0.0007255226373672485, -0.0006716549396514893, -0.00061778724193573, -0.0005639195442199707, -0.0005100518465042114, -0.00045618414878845215, -0.00040231645107269287, -0.0003484487533569336, -0.0002945810556411743, -0.00024071335792541504, -0.00018684566020965576, -0.00013297796249389648, -7.911026477813721e-05, -2.524256706237793e-05, 2.8625130653381348e-05, 8.249282836914062e-05, 0.0001363605260848999, 0.00019022822380065918, 0.00024409592151641846, 0.00029796361923217773, 0.000351831316947937, 0.0004056990146636963, 0.00045956671237945557, 0.0005134344100952148, 0.0005673021078109741, 0.0006211698055267334, 0.0006750375032424927, 0.000728905200958252, 0.0007827728986740112, 0.0008366405963897705, 0.0008905082941055298, 0.0009443759918212891, 0.0009982436895370483, 0.0010521113872528076, 0.001105979084968567, 0.0011598467826843262, 0.0012137144804000854, 0.0012675821781158447, 0.001321449875831604, 0.0013753175735473633, 0.0014291852712631226, 0.0014830529689788818, 0.0015369206666946411, 0.0015907883644104004, 0.0016446560621261597, 0.001698523759841919, 0.0017523914575576782, 0.0018062591552734375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 11.0, 15.0, 23.0, 35.0, 40.0, 57.0, 86.0, 130.0, 196.0, 297.0, 469.0, 739.0, 1133.0, 1876.0, 3235.0, 5543.0, 10321.0, 19116.0, 37827.0, 80860.0, 246468.0, 432102.0, 107609.0, 47255.0, 23956.0, 12478.0, 6858.0, 3820.0, 2258.0, 1313.0, 875.0, 519.0, 347.0, 199.0, 171.0, 94.0, 67.0, 46.0, 29.0, 25.0, 7.0, 15.0, 8.0, 5.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.890625, -28.961181640625, -28.03173828125, -27.102294921875, -26.1728515625, -25.243408203125, -24.31396484375, -23.384521484375, -22.455078125, -21.525634765625, -20.59619140625, -19.666748046875, -18.7373046875, -17.807861328125, -16.87841796875, -15.948974609375, -15.01953125, -14.090087890625, -13.16064453125, -12.231201171875, -11.3017578125, -10.372314453125, -9.44287109375, -8.513427734375, -7.583984375, -6.654541015625, -5.72509765625, -4.795654296875, -3.8662109375, -2.936767578125, -2.00732421875, -1.077880859375, -0.1484375, 0.781005859375, 1.71044921875, 2.639892578125, 3.5693359375, 4.498779296875, 5.42822265625, 6.357666015625, 7.287109375, 8.216552734375, 9.14599609375, 10.075439453125, 11.0048828125, 11.934326171875, 12.86376953125, 13.793212890625, 14.72265625, 15.652099609375, 16.58154296875, 17.510986328125, 18.4404296875, 19.369873046875, 20.29931640625, 21.228759765625, 22.158203125, 23.087646484375, 24.01708984375, 24.946533203125, 25.8759765625, 26.805419921875, 27.73486328125, 28.664306640625, 29.59375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 10.0, 7.0, 12.0, 17.0, 24.0, 16.0, 25.0, 22.0, 33.0, 27.0, 26.0, 43.0, 37.0, 39.0, 65.0, 66.0, 65.0, 76.0, 45.0, 41.0, 40.0, 43.0, 33.0, 24.0, 22.0, 21.0, 17.0, 18.0, 22.0, 13.0, 8.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.28125, -6.08709716796875, -5.8929443359375, -5.69879150390625, -5.504638671875, -5.31048583984375, -5.1163330078125, -4.92218017578125, -4.72802734375, -4.53387451171875, -4.3397216796875, -4.14556884765625, -3.951416015625, -3.75726318359375, -3.5631103515625, -3.36895751953125, -3.1748046875, -2.98065185546875, -2.7864990234375, -2.59234619140625, -2.398193359375, -2.20404052734375, -2.0098876953125, -1.81573486328125, -1.62158203125, -1.42742919921875, -1.2332763671875, -1.03912353515625, -0.844970703125, -0.65081787109375, -0.4566650390625, -0.26251220703125, -0.068359375, 0.12579345703125, 0.3199462890625, 0.51409912109375, 0.708251953125, 0.90240478515625, 1.0965576171875, 1.29071044921875, 1.48486328125, 1.67901611328125, 1.8731689453125, 2.06732177734375, 2.261474609375, 2.45562744140625, 2.6497802734375, 2.84393310546875, 3.0380859375, 3.23223876953125, 3.4263916015625, 3.62054443359375, 3.814697265625, 4.00885009765625, 4.2030029296875, 4.39715576171875, 4.59130859375, 4.78546142578125, 4.9796142578125, 5.17376708984375, 5.367919921875, 5.56207275390625, 5.7562255859375, 5.95037841796875, 6.14453125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 19.0, 11.0, 10.0, 22.0, 32.0, 39.0, 47.0, 62.0, 63.0, 68.0, 90.0, 97.0, 94.0, 61.0, 51.0, 42.0, 49.0, 24.0, 12.0, 21.0, 11.0, 12.0, 6.0, 4.0, 5.0, 2.0, 8.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-109.68895721435547, -106.00871276855469, -102.3284683227539, -98.64822387695312, -94.96797943115234, -91.28773498535156, -87.60748291015625, -83.92723846435547, -80.24699401855469, -76.5667495727539, -72.88650512695312, -69.20626068115234, -65.52601623535156, -61.845767974853516, -58.165523529052734, -54.48527526855469, -50.80503463745117, -47.12479019165039, -43.44454574584961, -39.76429748535156, -36.08405303955078, -32.40380859375, -28.72356414794922, -25.043317794799805, -21.363073348999023, -17.682828903198242, -14.002582550048828, -10.322338104248047, -6.642092704772949, -2.9618473052978516, 0.7183971405029297, 4.398643493652344, 8.078887939453125, 11.759133338928223, 15.43937873840332, 19.1196231842041, 22.799869537353516, 26.480113983154297, 30.160358428955078, 33.840606689453125, 37.520851135253906, 41.20109558105469, 44.88134002685547, 48.56158447265625, 52.2418327331543, 55.92207717895508, 59.60232162475586, 63.282569885253906, 66.96281433105469, 70.64305877685547, 74.32330322265625, 78.00354766845703, 81.68379211425781, 85.36404418945312, 89.04428100585938, 92.72453308105469, 96.40476989746094, 100.08501434326172, 103.7652587890625, 107.44550323486328, 111.12574768066406, 114.80599975585938, 118.48623657226562, 122.16648864746094, 125.84673309326172]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 3.0, 4.0, 8.0, 10.0, 15.0, 11.0, 18.0, 15.0, 25.0, 17.0, 23.0, 33.0, 35.0, 32.0, 44.0, 40.0, 37.0, 50.0, 35.0, 41.0, 43.0, 32.0, 38.0, 43.0, 35.0, 37.0, 30.0, 31.0, 36.0, 25.0, 26.0, 16.0, 17.0, 9.0, 18.0, 9.0, 9.0, 10.0, 8.0, 7.0, 3.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-84.2674331665039, -81.72209167480469, -79.17674255371094, -76.63140106201172, -74.0860595703125, -71.54071807861328, -68.99536895751953, -66.45002746582031, -63.904685974121094, -61.35934066772461, -58.81399917602539, -56.268653869628906, -53.72331237792969, -51.1779670715332, -48.63262176513672, -46.0872802734375, -43.541934967041016, -40.99658966064453, -38.45124816894531, -35.90590286254883, -33.36056137084961, -30.815216064453125, -28.269872665405273, -25.724529266357422, -23.17918586730957, -20.63384246826172, -18.088499069213867, -15.5431547164917, -12.997811317443848, -10.452467918395996, -7.907123565673828, -5.361780166625977, -2.816436767578125, -0.27109313011169434, 2.2742505073547363, 4.819594383239746, 7.364937782287598, 9.91028118133545, 12.455625534057617, 15.000968933105469, 17.54631233215332, 20.091655731201172, 22.636999130249023, 25.182342529296875, 27.72768783569336, 30.273029327392578, 32.81837463378906, 35.36371612548828, 37.909061431884766, 40.45440673828125, 42.99974822998047, 45.54509353637695, 48.09043502807617, 50.635780334472656, 53.181121826171875, 55.72646713256836, 58.271812438964844, 60.81715774536133, 63.36249923706055, 65.90784454345703, 68.45318603515625, 70.99852752685547, 73.54387664794922, 76.08921813964844, 78.63455963134766]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 6.0, 14.0, 17.0, 20.0, 45.0, 55.0, 106.0, 196.0, 291.0, 444.0, 745.0, 1146.0, 1711.0, 2741.0, 4714.0, 7385.0, 12377.0, 20669.0, 36391.0, 68637.0, 135821.0, 251648.0, 235673.0, 123092.0, 61923.0, 33660.0, 19379.0, 11205.0, 6826.0, 4352.0, 2664.0, 1708.0, 1040.0, 686.0, 454.0, 250.0, 183.0, 107.0, 61.0, 34.0, 20.0, 18.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-162.75, -157.953125, -153.15625, -148.359375, -143.5625, -138.765625, -133.96875, -129.171875, -124.375, -119.578125, -114.78125, -109.984375, -105.1875, -100.390625, -95.59375, -90.796875, -86.0, -81.203125, -76.40625, -71.609375, -66.8125, -62.015625, -57.21875, -52.421875, -47.625, -42.828125, -38.03125, -33.234375, -28.4375, -23.640625, -18.84375, -14.046875, -9.25, -4.453125, 0.34375, 5.140625, 9.9375, 14.734375, 19.53125, 24.328125, 29.125, 33.921875, 38.71875, 43.515625, 48.3125, 53.109375, 57.90625, 62.703125, 67.5, 72.296875, 77.09375, 81.890625, 86.6875, 91.484375, 96.28125, 101.078125, 105.875, 110.671875, 115.46875, 120.265625, 125.0625, 129.859375, 134.65625, 139.453125, 144.25]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 9.0, 4.0, 8.0, 10.0, 13.0, 20.0, 14.0, 30.0, 17.0, 19.0, 33.0, 33.0, 23.0, 38.0, 38.0, 43.0, 33.0, 41.0, 44.0, 40.0, 40.0, 33.0, 33.0, 40.0, 44.0, 43.0, 17.0, 31.0, 25.0, 23.0, 18.0, 23.0, 18.0, 14.0, 11.0, 15.0, 9.0, 3.0, 10.0, 8.0, 4.0, 3.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-55.40625, -53.6494140625, -51.892578125, -50.1357421875, -48.37890625, -46.6220703125, -44.865234375, -43.1083984375, -41.3515625, -39.5947265625, -37.837890625, -36.0810546875, -34.32421875, -32.5673828125, -30.810546875, -29.0537109375, -27.296875, -25.5400390625, -23.783203125, -22.0263671875, -20.26953125, -18.5126953125, -16.755859375, -14.9990234375, -13.2421875, -11.4853515625, -9.728515625, -7.9716796875, -6.21484375, -4.4580078125, -2.701171875, -0.9443359375, 0.8125, 2.5693359375, 4.326171875, 6.0830078125, 7.83984375, 9.5966796875, 11.353515625, 13.1103515625, 14.8671875, 16.6240234375, 18.380859375, 20.1376953125, 21.89453125, 23.6513671875, 25.408203125, 27.1650390625, 28.921875, 30.6787109375, 32.435546875, 34.1923828125, 35.94921875, 37.7060546875, 39.462890625, 41.2197265625, 42.9765625, 44.7333984375, 46.490234375, 48.2470703125, 50.00390625, 51.7607421875, 53.517578125, 55.2744140625, 57.03125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 21.0, 26.0, 24.0, 49.0, 72.0, 120.0, 143.0, 222.0, 359.0, 523.0, 771.0, 1185.0, 1749.0, 2756.0, 4261.0, 6402.0, 9640.0, 15178.0, 23561.0, 38354.0, 64399.0, 112702.0, 196332.0, 225625.0, 139303.0, 79260.0, 46513.0, 28195.0, 17751.0, 11260.0, 7544.0, 4749.0, 3225.0, 2149.0, 1330.0, 918.0, 645.0, 396.0, 271.0, 180.0, 128.0, 85.0, 50.0, 39.0, 19.0, 20.0, 13.0, 12.0, 5.0, 6.0, 3.0, 2.0, 1.0], "bins": [-123.1875, -119.583984375, -115.98046875, -112.376953125, -108.7734375, -105.169921875, -101.56640625, -97.962890625, -94.359375, -90.755859375, -87.15234375, -83.548828125, -79.9453125, -76.341796875, -72.73828125, -69.134765625, -65.53125, -61.927734375, -58.32421875, -54.720703125, -51.1171875, -47.513671875, -43.91015625, -40.306640625, -36.703125, -33.099609375, -29.49609375, -25.892578125, -22.2890625, -18.685546875, -15.08203125, -11.478515625, -7.875, -4.271484375, -0.66796875, 2.935546875, 6.5390625, 10.142578125, 13.74609375, 17.349609375, 20.953125, 24.556640625, 28.16015625, 31.763671875, 35.3671875, 38.970703125, 42.57421875, 46.177734375, 49.78125, 53.384765625, 56.98828125, 60.591796875, 64.1953125, 67.798828125, 71.40234375, 75.005859375, 78.609375, 82.212890625, 85.81640625, 89.419921875, 93.0234375, 96.626953125, 100.23046875, 103.833984375, 107.4375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 5.0, 10.0, 6.0, 13.0, 16.0, 14.0, 22.0, 20.0, 21.0, 20.0, 22.0, 28.0, 29.0, 18.0, 41.0, 38.0, 46.0, 39.0, 42.0, 45.0, 47.0, 32.0, 46.0, 39.0, 46.0, 35.0, 43.0, 29.0, 27.0, 24.0, 17.0, 20.0, 16.0, 18.0, 14.0, 11.0, 10.0, 11.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.34375, -37.04052734375, -35.7373046875, -34.43408203125, -33.130859375, -31.82763671875, -30.5244140625, -29.22119140625, -27.91796875, -26.61474609375, -25.3115234375, -24.00830078125, -22.705078125, -21.40185546875, -20.0986328125, -18.79541015625, -17.4921875, -16.18896484375, -14.8857421875, -13.58251953125, -12.279296875, -10.97607421875, -9.6728515625, -8.36962890625, -7.06640625, -5.76318359375, -4.4599609375, -3.15673828125, -1.853515625, -0.55029296875, 0.7529296875, 2.05615234375, 3.359375, 4.66259765625, 5.9658203125, 7.26904296875, 8.572265625, 9.87548828125, 11.1787109375, 12.48193359375, 13.78515625, 15.08837890625, 16.3916015625, 17.69482421875, 18.998046875, 20.30126953125, 21.6044921875, 22.90771484375, 24.2109375, 25.51416015625, 26.8173828125, 28.12060546875, 29.423828125, 30.72705078125, 32.0302734375, 33.33349609375, 34.63671875, 35.93994140625, 37.2431640625, 38.54638671875, 39.849609375, 41.15283203125, 42.4560546875, 43.75927734375, 45.0625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 8.0, 18.0, 17.0, 27.0, 34.0, 38.0, 53.0, 72.0, 105.0, 128.0, 173.0, 228.0, 315.0, 455.0, 588.0, 926.0, 1286.0, 1865.0, 2937.0, 4602.0, 7992.0, 14377.0, 28653.0, 68730.0, 299123.0, 458780.0, 83938.0, 33408.0, 15910.0, 8562.0, 5123.0, 3207.0, 2085.0, 1354.0, 956.0, 639.0, 513.0, 371.0, 256.0, 178.0, 142.0, 106.0, 83.0, 43.0, 36.0, 28.0, 22.0, 19.0, 14.0, 14.0, 5.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-76.75, -74.3583984375, -71.966796875, -69.5751953125, -67.18359375, -64.7919921875, -62.400390625, -60.0087890625, -57.6171875, -55.2255859375, -52.833984375, -50.4423828125, -48.05078125, -45.6591796875, -43.267578125, -40.8759765625, -38.484375, -36.0927734375, -33.701171875, -31.3095703125, -28.91796875, -26.5263671875, -24.134765625, -21.7431640625, -19.3515625, -16.9599609375, -14.568359375, -12.1767578125, -9.78515625, -7.3935546875, -5.001953125, -2.6103515625, -0.21875, 2.1728515625, 4.564453125, 6.9560546875, 9.34765625, 11.7392578125, 14.130859375, 16.5224609375, 18.9140625, 21.3056640625, 23.697265625, 26.0888671875, 28.48046875, 30.8720703125, 33.263671875, 35.6552734375, 38.046875, 40.4384765625, 42.830078125, 45.2216796875, 47.61328125, 50.0048828125, 52.396484375, 54.7880859375, 57.1796875, 59.5712890625, 61.962890625, 64.3544921875, 66.74609375, 69.1376953125, 71.529296875, 73.9208984375, 76.3125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 26.0, 26.0, 38.0, 53.0, 101.0, 132.0, 195.0, 129.0, 91.0, 54.0, 39.0, 26.0, 16.0, 8.0, 7.0, 9.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003662109375, -0.003498971462249756, -0.0033358335494995117, -0.0031726956367492676, -0.0030095577239990234, -0.0028464198112487793, -0.002683281898498535, -0.002520143985748291, -0.002357006072998047, -0.0021938681602478027, -0.0020307302474975586, -0.0018675923347473145, -0.0017044544219970703, -0.0015413165092468262, -0.001378178596496582, -0.0012150406837463379, -0.0010519027709960938, -0.0008887648582458496, -0.0007256269454956055, -0.0005624890327453613, -0.0003993511199951172, -0.00023621320724487305, -7.30752944946289e-05, 9.006261825561523e-05, 0.0002532005310058594, 0.0004163384437561035, 0.0005794763565063477, 0.0007426142692565918, 0.0009057521820068359, 0.00106889009475708, 0.0012320280075073242, 0.0013951659202575684, 0.0015583038330078125, 0.0017214417457580566, 0.0018845796585083008, 0.002047717571258545, 0.002210855484008789, 0.002373993396759033, 0.0025371313095092773, 0.0027002692222595215, 0.0028634071350097656, 0.0030265450477600098, 0.003189682960510254, 0.003352820873260498, 0.003515958786010742, 0.0036790966987609863, 0.0038422346115112305, 0.004005372524261475, 0.004168510437011719, 0.004331648349761963, 0.004494786262512207, 0.004657924175262451, 0.004821062088012695, 0.0049842000007629395, 0.005147337913513184, 0.005310475826263428, 0.005473613739013672, 0.005636751651763916, 0.00579988956451416, 0.005963027477264404, 0.0061261653900146484, 0.006289303302764893, 0.006452441215515137, 0.006615579128265381, 0.006778717041015625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 12.0, 9.0, 17.0, 38.0, 32.0, 50.0, 76.0, 104.0, 168.0, 263.0, 405.0, 539.0, 887.0, 1539.0, 2520.0, 4977.0, 10497.0, 27657.0, 105890.0, 708048.0, 129662.0, 31464.0, 11529.0, 5226.0, 2659.0, 1527.0, 900.0, 613.0, 416.0, 249.0, 180.0, 112.0, 87.0, 67.0, 39.0, 28.0, 25.0, 13.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.375, -124.431640625, -120.48828125, -116.544921875, -112.6015625, -108.658203125, -104.71484375, -100.771484375, -96.828125, -92.884765625, -88.94140625, -84.998046875, -81.0546875, -77.111328125, -73.16796875, -69.224609375, -65.28125, -61.337890625, -57.39453125, -53.451171875, -49.5078125, -45.564453125, -41.62109375, -37.677734375, -33.734375, -29.791015625, -25.84765625, -21.904296875, -17.9609375, -14.017578125, -10.07421875, -6.130859375, -2.1875, 1.755859375, 5.69921875, 9.642578125, 13.5859375, 17.529296875, 21.47265625, 25.416015625, 29.359375, 33.302734375, 37.24609375, 41.189453125, 45.1328125, 49.076171875, 53.01953125, 56.962890625, 60.90625, 64.849609375, 68.79296875, 72.736328125, 76.6796875, 80.623046875, 84.56640625, 88.509765625, 92.453125, 96.396484375, 100.33984375, 104.283203125, 108.2265625, 112.169921875, 116.11328125, 120.056640625, 124.0]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 10.0, 2.0, 9.0, 13.0, 15.0, 20.0, 26.0, 46.0, 59.0, 71.0, 119.0, 157.0, 112.0, 79.0, 61.0, 48.0, 40.0, 17.0, 23.0, 12.0, 20.0, 5.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.125, -27.26123046875, -26.3974609375, -25.53369140625, -24.669921875, -23.80615234375, -22.9423828125, -22.07861328125, -21.21484375, -20.35107421875, -19.4873046875, -18.62353515625, -17.759765625, -16.89599609375, -16.0322265625, -15.16845703125, -14.3046875, -13.44091796875, -12.5771484375, -11.71337890625, -10.849609375, -9.98583984375, -9.1220703125, -8.25830078125, -7.39453125, -6.53076171875, -5.6669921875, -4.80322265625, -3.939453125, -3.07568359375, -2.2119140625, -1.34814453125, -0.484375, 0.37939453125, 1.2431640625, 2.10693359375, 2.970703125, 3.83447265625, 4.6982421875, 5.56201171875, 6.42578125, 7.28955078125, 8.1533203125, 9.01708984375, 9.880859375, 10.74462890625, 11.6083984375, 12.47216796875, 13.3359375, 14.19970703125, 15.0634765625, 15.92724609375, 16.791015625, 17.65478515625, 18.5185546875, 19.38232421875, 20.24609375, 21.10986328125, 21.9736328125, 22.83740234375, 23.701171875, 24.56494140625, 25.4287109375, 26.29248046875, 27.15625]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 7.0, 10.0, 9.0, 15.0, 20.0, 26.0, 34.0, 39.0, 47.0, 73.0, 71.0, 79.0, 80.0, 70.0, 67.0, 58.0, 69.0, 39.0, 34.0, 22.0, 15.0, 20.0, 9.0, 15.0, 20.0, 5.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-79.6473159790039, -76.89523315429688, -74.14314270019531, -71.39105224609375, -68.63896942138672, -65.88688659667969, -63.134796142578125, -60.38270950317383, -57.63062286376953, -54.878536224365234, -52.12644958496094, -49.37436294555664, -46.622276306152344, -43.87018966674805, -41.11810302734375, -38.36601638793945, -35.613929748535156, -32.86184310913086, -30.109756469726562, -27.357669830322266, -24.60558319091797, -21.853496551513672, -19.101409912109375, -16.349323272705078, -13.597236633300781, -10.845149993896484, -8.093063354492188, -5.340976715087891, -2.5888900756835938, 0.16319656372070312, 2.915283203125, 5.667369842529297, 8.419456481933594, 11.17154312133789, 13.923629760742188, 16.675716400146484, 19.42780303955078, 22.179889678955078, 24.931976318359375, 27.684062957763672, 30.43614959716797, 33.188236236572266, 35.94032287597656, 38.69240951538086, 41.444496154785156, 44.19658279418945, 46.94866943359375, 49.70075607299805, 52.452842712402344, 55.20492935180664, 57.95701599121094, 60.709102630615234, 63.46118927001953, 66.21327209472656, 68.96536254882812, 71.71745300292969, 74.46953582763672, 77.22161865234375, 79.97370910644531, 82.72579956054688, 85.4778823852539, 88.22996520996094, 90.9820556640625, 93.73414611816406, 96.4862289428711]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 6.0, 15.0, 12.0, 18.0, 23.0, 15.0, 20.0, 24.0, 22.0, 37.0, 37.0, 29.0, 34.0, 36.0, 45.0, 44.0, 42.0, 41.0, 32.0, 52.0, 42.0, 49.0, 28.0, 31.0, 28.0, 37.0, 26.0, 18.0, 22.0, 23.0, 10.0, 11.0, 15.0, 18.0, 8.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-74.65203857421875, -72.5244140625, -70.39678192138672, -68.26915740966797, -66.14152526855469, -64.01390075683594, -61.88627243041992, -59.758644104003906, -57.63101577758789, -55.503387451171875, -53.37575912475586, -51.248130798339844, -49.120506286621094, -46.99287414550781, -44.86524963378906, -42.73762130737305, -40.60999298095703, -38.482364654541016, -36.354736328125, -34.227108001708984, -32.09947967529297, -29.971853256225586, -27.844226837158203, -25.716598510742188, -23.588970184326172, -21.461341857910156, -19.33371353149414, -17.206087112426758, -15.078458786010742, -12.950830459594727, -10.823203086853027, -8.695575714111328, -6.567955017089844, -4.440327167510986, -2.312699317932129, -0.18507146835327148, 1.942556381225586, 4.070184707641602, 6.197812080383301, 8.325439453125, 10.453067779541016, 12.580696105957031, 14.70832347869873, 16.83595085144043, 18.963579177856445, 21.09120750427246, 23.218833923339844, 25.34646224975586, 27.474090576171875, 29.60171890258789, 31.729347229003906, 33.85697555541992, 35.98460388183594, 38.11222839355469, 40.2398567199707, 42.36748504638672, 44.495113372802734, 46.62274169921875, 48.750370025634766, 50.87799835205078, 53.00562286376953, 55.13325500488281, 57.26087951660156, 59.38850784301758, 61.516136169433594]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 10.0, 6.0, 12.0, 14.0, 30.0, 37.0, 58.0, 82.0, 119.0, 167.0, 255.0, 418.0, 621.0, 973.0, 1552.0, 2275.0, 3812.0, 6229.0, 10023.0, 16556.0, 27803.0, 48328.0, 87990.0, 179934.0, 650402.0, 1910222.0, 813966.0, 210543.0, 97677.0, 51905.0, 29032.0, 16930.0, 10218.0, 6022.0, 3818.0, 2338.0, 1462.0, 918.0, 526.0, 367.0, 223.0, 150.0, 83.0, 77.0, 44.0, 33.0, 14.0, 4.0, 8.0, 4.0, 3.0, 0.0, 2.0], "bins": [-105.875, -102.9794921875, -100.083984375, -97.1884765625, -94.29296875, -91.3974609375, -88.501953125, -85.6064453125, -82.7109375, -79.8154296875, -76.919921875, -74.0244140625, -71.12890625, -68.2333984375, -65.337890625, -62.4423828125, -59.546875, -56.6513671875, -53.755859375, -50.8603515625, -47.96484375, -45.0693359375, -42.173828125, -39.2783203125, -36.3828125, -33.4873046875, -30.591796875, -27.6962890625, -24.80078125, -21.9052734375, -19.009765625, -16.1142578125, -13.21875, -10.3232421875, -7.427734375, -4.5322265625, -1.63671875, 1.2587890625, 4.154296875, 7.0498046875, 9.9453125, 12.8408203125, 15.736328125, 18.6318359375, 21.52734375, 24.4228515625, 27.318359375, 30.2138671875, 33.109375, 36.0048828125, 38.900390625, 41.7958984375, 44.69140625, 47.5869140625, 50.482421875, 53.3779296875, 56.2734375, 59.1689453125, 62.064453125, 64.9599609375, 67.85546875, 70.7509765625, 73.646484375, 76.5419921875, 79.4375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 12.0, 11.0, 14.0, 15.0, 22.0, 15.0, 32.0, 15.0, 22.0, 15.0, 32.0, 32.0, 40.0, 34.0, 42.0, 35.0, 34.0, 37.0, 46.0, 46.0, 45.0, 33.0, 38.0, 38.0, 37.0, 27.0, 29.0, 21.0, 25.0, 23.0, 16.0, 14.0, 13.0, 16.0, 11.0, 9.0, 9.0, 7.0, 6.0, 5.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-39.75, -38.62060546875, -37.4912109375, -36.36181640625, -35.232421875, -34.10302734375, -32.9736328125, -31.84423828125, -30.71484375, -29.58544921875, -28.4560546875, -27.32666015625, -26.197265625, -25.06787109375, -23.9384765625, -22.80908203125, -21.6796875, -20.55029296875, -19.4208984375, -18.29150390625, -17.162109375, -16.03271484375, -14.9033203125, -13.77392578125, -12.64453125, -11.51513671875, -10.3857421875, -9.25634765625, -8.126953125, -6.99755859375, -5.8681640625, -4.73876953125, -3.609375, -2.47998046875, -1.3505859375, -0.22119140625, 0.908203125, 2.03759765625, 3.1669921875, 4.29638671875, 5.42578125, 6.55517578125, 7.6845703125, 8.81396484375, 9.943359375, 11.07275390625, 12.2021484375, 13.33154296875, 14.4609375, 15.59033203125, 16.7197265625, 17.84912109375, 18.978515625, 20.10791015625, 21.2373046875, 22.36669921875, 23.49609375, 24.62548828125, 25.7548828125, 26.88427734375, 28.013671875, 29.14306640625, 30.2724609375, 31.40185546875, 32.53125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 7.0, 5.0, 15.0, 11.0, 26.0, 31.0, 60.0, 88.0, 114.0, 196.0, 285.0, 421.0, 672.0, 1053.0, 1650.0, 2671.0, 4570.0, 7579.0, 12994.0, 24028.0, 44672.0, 88575.0, 190105.0, 474734.0, 1695397.0, 1026762.0, 327057.0, 140849.0, 68439.0, 35074.0, 19072.0, 10743.0, 6232.0, 3788.0, 2289.0, 1408.0, 919.0, 586.0, 376.0, 241.0, 163.0, 114.0, 76.0, 57.0, 31.0, 20.0, 12.0, 9.0, 8.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.875, -75.34765625, -72.8203125, -70.29296875, -67.765625, -65.23828125, -62.7109375, -60.18359375, -57.65625, -55.12890625, -52.6015625, -50.07421875, -47.546875, -45.01953125, -42.4921875, -39.96484375, -37.4375, -34.91015625, -32.3828125, -29.85546875, -27.328125, -24.80078125, -22.2734375, -19.74609375, -17.21875, -14.69140625, -12.1640625, -9.63671875, -7.109375, -4.58203125, -2.0546875, 0.47265625, 3.0, 5.52734375, 8.0546875, 10.58203125, 13.109375, 15.63671875, 18.1640625, 20.69140625, 23.21875, 25.74609375, 28.2734375, 30.80078125, 33.328125, 35.85546875, 38.3828125, 40.91015625, 43.4375, 45.96484375, 48.4921875, 51.01953125, 53.546875, 56.07421875, 58.6015625, 61.12890625, 63.65625, 66.18359375, 68.7109375, 71.23828125, 73.765625, 76.29296875, 78.8203125, 81.34765625, 83.875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 4.0, 7.0, 9.0, 11.0, 10.0, 14.0, 26.0, 45.0, 38.0, 36.0, 58.0, 60.0, 78.0, 101.0, 117.0, 155.0, 206.0, 285.0, 422.0, 465.0, 431.0, 327.0, 225.0, 189.0, 146.0, 129.0, 100.0, 82.0, 58.0, 42.0, 43.0, 36.0, 28.0, 21.0, 18.0, 8.0, 9.0, 6.0, 6.0, 11.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.703125, -19.958740234375, -19.21435546875, -18.469970703125, -17.7255859375, -16.981201171875, -16.23681640625, -15.492431640625, -14.748046875, -14.003662109375, -13.25927734375, -12.514892578125, -11.7705078125, -11.026123046875, -10.28173828125, -9.537353515625, -8.79296875, -8.048583984375, -7.30419921875, -6.559814453125, -5.8154296875, -5.071044921875, -4.32666015625, -3.582275390625, -2.837890625, -2.093505859375, -1.34912109375, -0.604736328125, 0.1396484375, 0.884033203125, 1.62841796875, 2.372802734375, 3.1171875, 3.861572265625, 4.60595703125, 5.350341796875, 6.0947265625, 6.839111328125, 7.58349609375, 8.327880859375, 9.072265625, 9.816650390625, 10.56103515625, 11.305419921875, 12.0498046875, 12.794189453125, 13.53857421875, 14.282958984375, 15.02734375, 15.771728515625, 16.51611328125, 17.260498046875, 18.0048828125, 18.749267578125, 19.49365234375, 20.238037109375, 20.982421875, 21.726806640625, 22.47119140625, 23.215576171875, 23.9599609375, 24.704345703125, 25.44873046875, 26.193115234375, 26.9375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 10.0, 4.0, 5.0, 12.0, 19.0, 17.0, 22.0, 26.0, 28.0, 34.0, 41.0, 50.0, 58.0, 70.0, 93.0, 99.0, 74.0, 63.0, 60.0, 37.0, 28.0, 30.0, 18.0, 22.0, 16.0, 9.0, 8.0, 9.0, 6.0, 6.0, 1.0, 4.0, 3.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.53485107421875, -53.789913177490234, -52.04497528076172, -50.30003356933594, -48.55509567260742, -46.810157775878906, -45.065216064453125, -43.32027816772461, -41.575340270996094, -39.83040237426758, -38.08546447753906, -36.34052276611328, -34.595584869384766, -32.85064697265625, -31.1057071685791, -29.360767364501953, -27.615829467773438, -25.870891571044922, -24.125951766967773, -22.381011962890625, -20.63607406616211, -18.891136169433594, -17.146196365356445, -15.401257514953613, -13.656318664550781, -11.91137981414795, -10.166440963745117, -8.421502113342285, -6.676563262939453, -4.931624412536621, -3.186685562133789, -1.441746711730957, 0.3031883239746094, 2.0481271743774414, 3.7930660247802734, 5.5380048751831055, 7.2829437255859375, 9.02788257598877, 10.772821426391602, 12.517760276794434, 14.262699127197266, 16.00763702392578, 17.75257682800293, 19.497516632080078, 21.242454528808594, 22.98739242553711, 24.732332229614258, 26.477272033691406, 28.222209930419922, 29.967147827148438, 31.712087631225586, 33.457027435302734, 35.20196533203125, 36.946903228759766, 38.69184112548828, 40.43678283691406, 42.18172073364258, 43.926658630371094, 45.671600341796875, 47.41653823852539, 49.161476135253906, 50.90641403198242, 52.65135192871094, 54.39629364013672, 56.141231536865234]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 6.0, 10.0, 10.0, 12.0, 14.0, 19.0, 15.0, 16.0, 19.0, 24.0, 20.0, 26.0, 36.0, 29.0, 46.0, 32.0, 32.0, 40.0, 43.0, 43.0, 40.0, 48.0, 39.0, 34.0, 31.0, 28.0, 33.0, 38.0, 32.0, 23.0, 18.0, 18.0, 26.0, 21.0, 16.0, 15.0, 14.0, 6.0, 7.0, 3.0, 3.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.078182220458984, -46.74728012084961, -45.41637420654297, -44.085472106933594, -42.75457000732422, -41.423667907714844, -40.0927619934082, -38.76185989379883, -37.43095397949219, -36.10005187988281, -34.76914596557617, -33.4382438659668, -32.10734176635742, -30.776437759399414, -29.445533752441406, -28.11463165283203, -26.783729553222656, -25.45282554626465, -24.121923446655273, -22.791019439697266, -21.46011734008789, -20.129213333129883, -18.798309326171875, -17.4674072265625, -16.136503219604492, -14.8056001663208, -13.47469711303711, -12.143793106079102, -10.81289005279541, -9.481986999511719, -8.151082992553711, -6.8201799392700195, -5.489280700683594, -4.158377647399902, -2.8274741172790527, -1.4965708255767822, -0.16566753387451172, 1.1652355194091797, 2.4961390495300293, 3.827042579650879, 5.15794563293457, 6.488848686218262, 7.819752216339111, 9.150655746459961, 10.481558799743652, 11.812461853027344, 13.143365859985352, 14.474268913269043, 15.805171966552734, 17.136075973510742, 18.466978073120117, 19.797882080078125, 21.1287841796875, 22.459688186645508, 23.790592193603516, 25.12149429321289, 26.4523983001709, 27.783302307128906, 29.11420440673828, 30.44510841369629, 31.776012420654297, 33.10691452026367, 34.43781661987305, 35.76872253417969, 37.09962463378906]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 7.0, 8.0, 14.0, 15.0, 26.0, 51.0, 79.0, 88.0, 142.0, 222.0, 347.0, 476.0, 661.0, 1117.0, 1791.0, 2643.0, 4159.0, 6505.0, 10340.0, 16123.0, 25642.0, 42690.0, 70992.0, 121506.0, 208253.0, 215533.0, 127284.0, 74090.0, 44538.0, 27468.0, 16592.0, 10342.0, 6571.0, 4206.0, 2734.0, 1795.0, 1169.0, 763.0, 518.0, 343.0, 238.0, 151.0, 114.0, 67.0, 34.0, 33.0, 24.0, 15.0, 11.0, 8.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -17.998291015625, -17.41845703125, -16.838623046875, -16.2587890625, -15.678955078125, -15.09912109375, -14.519287109375, -13.939453125, -13.359619140625, -12.77978515625, -12.199951171875, -11.6201171875, -11.040283203125, -10.46044921875, -9.880615234375, -9.30078125, -8.720947265625, -8.14111328125, -7.561279296875, -6.9814453125, -6.401611328125, -5.82177734375, -5.241943359375, -4.662109375, -4.082275390625, -3.50244140625, -2.922607421875, -2.3427734375, -1.762939453125, -1.18310546875, -0.603271484375, -0.0234375, 0.556396484375, 1.13623046875, 1.716064453125, 2.2958984375, 2.875732421875, 3.45556640625, 4.035400390625, 4.615234375, 5.195068359375, 5.77490234375, 6.354736328125, 6.9345703125, 7.514404296875, 8.09423828125, 8.674072265625, 9.25390625, 9.833740234375, 10.41357421875, 10.993408203125, 11.5732421875, 12.153076171875, 12.73291015625, 13.312744140625, 13.892578125, 14.472412109375, 15.05224609375, 15.632080078125, 16.2119140625, 16.791748046875, 17.37158203125, 17.951416015625, 18.53125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 5.0, 4.0, 11.0, 13.0, 10.0, 19.0, 13.0, 18.0, 20.0, 16.0, 21.0, 36.0, 33.0, 39.0, 31.0, 40.0, 37.0, 27.0, 40.0, 27.0, 44.0, 30.0, 43.0, 38.0, 32.0, 30.0, 39.0, 40.0, 31.0, 22.0, 23.0, 18.0, 24.0, 20.0, 25.0, 10.0, 9.0, 9.0, 13.0, 8.0, 9.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0], "bins": [-46.28125, -45.01220703125, -43.7431640625, -42.47412109375, -41.205078125, -39.93603515625, -38.6669921875, -37.39794921875, -36.12890625, -34.85986328125, -33.5908203125, -32.32177734375, -31.052734375, -29.78369140625, -28.5146484375, -27.24560546875, -25.9765625, -24.70751953125, -23.4384765625, -22.16943359375, -20.900390625, -19.63134765625, -18.3623046875, -17.09326171875, -15.82421875, -14.55517578125, -13.2861328125, -12.01708984375, -10.748046875, -9.47900390625, -8.2099609375, -6.94091796875, -5.671875, -4.40283203125, -3.1337890625, -1.86474609375, -0.595703125, 0.67333984375, 1.9423828125, 3.21142578125, 4.48046875, 5.74951171875, 7.0185546875, 8.28759765625, 9.556640625, 10.82568359375, 12.0947265625, 13.36376953125, 14.6328125, 15.90185546875, 17.1708984375, 18.43994140625, 19.708984375, 20.97802734375, 22.2470703125, 23.51611328125, 24.78515625, 26.05419921875, 27.3232421875, 28.59228515625, 29.861328125, 31.13037109375, 32.3994140625, 33.66845703125, 34.9375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 13.0, 15.0, 30.0, 29.0, 42.0, 80.0, 96.0, 214.0, 346.0, 635.0, 1022.0, 1757.0, 3047.0, 5288.0, 9911.0, 17961.0, 34117.0, 67352.0, 146232.0, 348747.0, 218991.0, 93976.0, 45741.0, 23707.0, 12798.0, 7004.0, 4015.0, 2265.0, 1233.0, 752.0, 463.0, 274.0, 153.0, 74.0, 71.0, 30.0, 25.0, 24.0, 10.0, 4.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.453125, -15.9503173828125, -15.447509765625, -14.9447021484375, -14.44189453125, -13.9390869140625, -13.436279296875, -12.9334716796875, -12.4306640625, -11.9278564453125, -11.425048828125, -10.9222412109375, -10.41943359375, -9.9166259765625, -9.413818359375, -8.9110107421875, -8.408203125, -7.9053955078125, -7.402587890625, -6.8997802734375, -6.39697265625, -5.8941650390625, -5.391357421875, -4.8885498046875, -4.3857421875, -3.8829345703125, -3.380126953125, -2.8773193359375, -2.37451171875, -1.8717041015625, -1.368896484375, -0.8660888671875, -0.36328125, 0.1395263671875, 0.642333984375, 1.1451416015625, 1.64794921875, 2.1507568359375, 2.653564453125, 3.1563720703125, 3.6591796875, 4.1619873046875, 4.664794921875, 5.1676025390625, 5.67041015625, 6.1732177734375, 6.676025390625, 7.1788330078125, 7.681640625, 8.1844482421875, 8.687255859375, 9.1900634765625, 9.69287109375, 10.1956787109375, 10.698486328125, 11.2012939453125, 11.7041015625, 12.2069091796875, 12.709716796875, 13.2125244140625, 13.71533203125, 14.2181396484375, 14.720947265625, 15.2237548828125, 15.7265625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 8.0, 6.0, 12.0, 12.0, 11.0, 17.0, 22.0, 22.0, 22.0, 33.0, 34.0, 27.0, 30.0, 39.0, 43.0, 57.0, 57.0, 43.0, 47.0, 61.0, 37.0, 37.0, 41.0, 42.0, 28.0, 33.0, 37.0, 28.0, 22.0, 24.0, 10.0, 14.0, 15.0, 8.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.703125, -29.724365234375, -28.74560546875, -27.766845703125, -26.7880859375, -25.809326171875, -24.83056640625, -23.851806640625, -22.873046875, -21.894287109375, -20.91552734375, -19.936767578125, -18.9580078125, -17.979248046875, -17.00048828125, -16.021728515625, -15.04296875, -14.064208984375, -13.08544921875, -12.106689453125, -11.1279296875, -10.149169921875, -9.17041015625, -8.191650390625, -7.212890625, -6.234130859375, -5.25537109375, -4.276611328125, -3.2978515625, -2.319091796875, -1.34033203125, -0.361572265625, 0.6171875, 1.595947265625, 2.57470703125, 3.553466796875, 4.5322265625, 5.510986328125, 6.48974609375, 7.468505859375, 8.447265625, 9.426025390625, 10.40478515625, 11.383544921875, 12.3623046875, 13.341064453125, 14.31982421875, 15.298583984375, 16.27734375, 17.256103515625, 18.23486328125, 19.213623046875, 20.1923828125, 21.171142578125, 22.14990234375, 23.128662109375, 24.107421875, 25.086181640625, 26.06494140625, 27.043701171875, 28.0224609375, 29.001220703125, 29.97998046875, 30.958740234375, 31.9375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 5.0, 9.0, 6.0, 9.0, 12.0, 21.0, 30.0, 49.0, 51.0, 61.0, 151.0, 171.0, 272.0, 368.0, 542.0, 812.0, 1199.0, 1797.0, 2943.0, 4603.0, 8093.0, 14452.0, 27630.0, 61056.0, 178489.0, 515207.0, 128083.0, 48473.0, 23240.0, 12072.0, 6894.0, 4209.0, 2582.0, 1587.0, 1060.0, 708.0, 470.0, 316.0, 227.0, 178.0, 99.0, 83.0, 61.0, 52.0, 38.0, 24.0, 26.0, 12.0, 2.0, 10.0, 9.0, 4.0, 3.0, 4.0], "bins": [-7.13671875, -6.9349365234375, -6.733154296875, -6.5313720703125, -6.32958984375, -6.1278076171875, -5.926025390625, -5.7242431640625, -5.5224609375, -5.3206787109375, -5.118896484375, -4.9171142578125, -4.71533203125, -4.5135498046875, -4.311767578125, -4.1099853515625, -3.908203125, -3.7064208984375, -3.504638671875, -3.3028564453125, -3.10107421875, -2.8992919921875, -2.697509765625, -2.4957275390625, -2.2939453125, -2.0921630859375, -1.890380859375, -1.6885986328125, -1.48681640625, -1.2850341796875, -1.083251953125, -0.8814697265625, -0.6796875, -0.4779052734375, -0.276123046875, -0.0743408203125, 0.12744140625, 0.3292236328125, 0.531005859375, 0.7327880859375, 0.9345703125, 1.1363525390625, 1.338134765625, 1.5399169921875, 1.74169921875, 1.9434814453125, 2.145263671875, 2.3470458984375, 2.548828125, 2.7506103515625, 2.952392578125, 3.1541748046875, 3.35595703125, 3.5577392578125, 3.759521484375, 3.9613037109375, 4.1630859375, 4.3648681640625, 4.566650390625, 4.7684326171875, 4.97021484375, 5.1719970703125, 5.373779296875, 5.5755615234375, 5.77734375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 2.0, 8.0, 4.0, 10.0, 9.0, 10.0, 13.0, 14.0, 32.0, 19.0, 31.0, 30.0, 38.0, 40.0, 49.0, 52.0, 61.0, 66.0, 46.0, 66.0, 63.0, 49.0, 43.0, 41.0, 30.0, 27.0, 25.0, 19.0, 15.0, 16.0, 9.0, 9.0, 9.0, 3.0, 4.0, 6.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0008144378662109375, -0.0007896125316619873, -0.0007647871971130371, -0.0007399618625640869, -0.0007151365280151367, -0.0006903111934661865, -0.0006654858589172363, -0.0006406605243682861, -0.0006158351898193359, -0.0005910098552703857, -0.0005661845207214355, -0.0005413591861724854, -0.0005165338516235352, -0.000491708517074585, -0.00046688318252563477, -0.00044205784797668457, -0.0004172325134277344, -0.0003924071788787842, -0.000367581844329834, -0.0003427565097808838, -0.0003179311752319336, -0.0002931058406829834, -0.0002682805061340332, -0.000243455171585083, -0.0002186298370361328, -0.00019380450248718262, -0.00016897916793823242, -0.00014415383338928223, -0.00011932849884033203, -9.450316429138184e-05, -6.967782974243164e-05, -4.4852495193481445e-05, -2.002716064453125e-05, 4.798173904418945e-06, 2.962350845336914e-05, 5.4448843002319336e-05, 7.927417755126953e-05, 0.00010409951210021973, 0.00012892484664916992, 0.00015375018119812012, 0.0001785755157470703, 0.0002034008502960205, 0.0002282261848449707, 0.0002530515193939209, 0.0002778768539428711, 0.0003027021884918213, 0.0003275275230407715, 0.0003523528575897217, 0.0003771781921386719, 0.00040200352668762207, 0.00042682886123657227, 0.00045165419578552246, 0.00047647953033447266, 0.0005013048648834229, 0.000526130199432373, 0.0005509555339813232, 0.0005757808685302734, 0.0006006062030792236, 0.0006254315376281738, 0.000650256872177124, 0.0006750822067260742, 0.0006999075412750244, 0.0007247328758239746, 0.0007495582103729248, 0.000774383544921875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 9.0, 10.0, 16.0, 22.0, 28.0, 27.0, 64.0, 89.0, 106.0, 181.0, 294.0, 431.0, 688.0, 1112.0, 1959.0, 3404.0, 6202.0, 12270.0, 25094.0, 54972.0, 132755.0, 458501.0, 203330.0, 78071.0, 34067.0, 16221.0, 8180.0, 4279.0, 2389.0, 1374.0, 868.0, 535.0, 337.0, 195.0, 131.0, 90.0, 78.0, 50.0, 28.0, 34.0, 20.0, 9.0, 11.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-25.421875, -24.64453125, -23.8671875, -23.08984375, -22.3125, -21.53515625, -20.7578125, -19.98046875, -19.203125, -18.42578125, -17.6484375, -16.87109375, -16.09375, -15.31640625, -14.5390625, -13.76171875, -12.984375, -12.20703125, -11.4296875, -10.65234375, -9.875, -9.09765625, -8.3203125, -7.54296875, -6.765625, -5.98828125, -5.2109375, -4.43359375, -3.65625, -2.87890625, -2.1015625, -1.32421875, -0.546875, 0.23046875, 1.0078125, 1.78515625, 2.5625, 3.33984375, 4.1171875, 4.89453125, 5.671875, 6.44921875, 7.2265625, 8.00390625, 8.78125, 9.55859375, 10.3359375, 11.11328125, 11.890625, 12.66796875, 13.4453125, 14.22265625, 15.0, 15.77734375, 16.5546875, 17.33203125, 18.109375, 18.88671875, 19.6640625, 20.44140625, 21.21875, 21.99609375, 22.7734375, 23.55078125, 24.328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 13.0, 13.0, 16.0, 15.0, 22.0, 33.0, 51.0, 59.0, 47.0, 46.0, 50.0, 61.0, 61.0, 76.0, 48.0, 59.0, 66.0, 50.0, 39.0, 44.0, 29.0, 29.0, 18.0, 16.0, 10.0, 10.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.15625, -6.95013427734375, -6.7440185546875, -6.53790283203125, -6.331787109375, -6.12567138671875, -5.9195556640625, -5.71343994140625, -5.50732421875, -5.30120849609375, -5.0950927734375, -4.88897705078125, -4.682861328125, -4.47674560546875, -4.2706298828125, -4.06451416015625, -3.8583984375, -3.65228271484375, -3.4461669921875, -3.24005126953125, -3.033935546875, -2.82781982421875, -2.6217041015625, -2.41558837890625, -2.20947265625, -2.00335693359375, -1.7972412109375, -1.59112548828125, -1.385009765625, -1.17889404296875, -0.9727783203125, -0.76666259765625, -0.560546875, -0.35443115234375, -0.1483154296875, 0.05780029296875, 0.263916015625, 0.47003173828125, 0.6761474609375, 0.88226318359375, 1.08837890625, 1.29449462890625, 1.5006103515625, 1.70672607421875, 1.912841796875, 2.11895751953125, 2.3250732421875, 2.53118896484375, 2.7373046875, 2.94342041015625, 3.1495361328125, 3.35565185546875, 3.561767578125, 3.76788330078125, 3.9739990234375, 4.18011474609375, 4.38623046875, 4.59234619140625, 4.7984619140625, 5.00457763671875, 5.210693359375, 5.41680908203125, 5.6229248046875, 5.82904052734375, 6.03515625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 0.0, 3.0, 4.0, 3.0, 7.0, 12.0, 11.0, 14.0, 12.0, 16.0, 26.0, 37.0, 31.0, 35.0, 37.0, 46.0, 60.0, 72.0, 95.0, 73.0, 67.0, 64.0, 46.0, 42.0, 23.0, 32.0, 18.0, 19.0, 23.0, 6.0, 7.0, 11.0, 6.0, 4.0, 8.0, 3.0, 3.0, 0.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-49.464019775390625, -47.83659744262695, -46.20917510986328, -44.58175277709961, -42.95433044433594, -41.326908111572266, -39.699485778808594, -38.07206726074219, -36.44464111328125, -34.81721878051758, -33.189796447753906, -31.562374114990234, -29.934951782226562, -28.30752944946289, -26.68010902404785, -25.05268669128418, -23.42526626586914, -21.79784393310547, -20.170421600341797, -18.542999267578125, -16.915576934814453, -15.288155555725098, -13.660734176635742, -12.03331184387207, -10.405889511108398, -8.778467178344727, -7.151045322418213, -5.523623466491699, -3.8962011337280273, -2.2687788009643555, -0.641357421875, 0.9860649108886719, 2.6134910583496094, 4.240913391113281, 5.868335247039795, 7.495757102966309, 9.12317943572998, 10.750601768493652, 12.378023147583008, 14.00544548034668, 15.632867813110352, 17.260290145874023, 18.887712478637695, 20.515132904052734, 22.142555236816406, 23.769977569580078, 25.39739990234375, 27.024822235107422, 28.652244567871094, 30.279666900634766, 31.907089233398438, 33.53451156616211, 35.16193389892578, 36.78935623168945, 38.416778564453125, 40.04419708251953, 41.67162322998047, 43.29904556274414, 44.92646789550781, 46.553890228271484, 48.181312561035156, 49.80873489379883, 51.4361572265625, 53.063575744628906, 54.69099807739258]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 11.0, 14.0, 17.0, 15.0, 18.0, 26.0, 19.0, 21.0, 32.0, 27.0, 31.0, 35.0, 37.0, 29.0, 52.0, 43.0, 36.0, 41.0, 42.0, 37.0, 35.0, 42.0, 26.0, 31.0, 43.0, 34.0, 27.0, 21.0, 17.0, 21.0, 24.0, 20.0, 11.0, 7.0, 14.0, 12.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.97496795654297, -50.50768280029297, -49.040401458740234, -47.573116302490234, -46.1058349609375, -44.6385498046875, -43.1712646484375, -41.703983306884766, -40.23670196533203, -38.76941680908203, -37.3021354675293, -35.8348503112793, -34.36756896972656, -32.90028381347656, -31.433000564575195, -29.965717315673828, -28.498432159423828, -27.03114891052246, -25.563865661621094, -24.096580505371094, -22.62929916381836, -21.16201400756836, -19.694730758666992, -18.227447509765625, -16.760164260864258, -15.29288101196289, -13.825597763061523, -12.35831356048584, -10.891030311584473, -9.423747062683105, -7.956462860107422, -6.489179611206055, -5.021892547607422, -3.5546090602874756, -2.0873255729675293, -0.6200418472290039, 0.8472414016723633, 2.3145246505737305, 3.781808853149414, 5.249092102050781, 6.716375350952148, 8.183658599853516, 9.650941848754883, 11.118226051330566, 12.585509300231934, 14.0527925491333, 15.520076751708984, 16.98736000061035, 18.45464324951172, 19.921926498413086, 21.389209747314453, 22.856494903564453, 24.323776245117188, 25.791061401367188, 27.258344650268555, 28.725627899169922, 30.19291114807129, 31.660194396972656, 33.127479553222656, 34.59476089477539, 36.06204605102539, 37.529327392578125, 38.996612548828125, 40.463897705078125, 41.93117904663086]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 8.0, 19.0, 22.0, 33.0, 47.0, 76.0, 88.0, 187.0, 259.0, 367.0, 561.0, 887.0, 1275.0, 1871.0, 2928.0, 4533.0, 6947.0, 10696.0, 16655.0, 26641.0, 43161.0, 70977.0, 121433.0, 199898.0, 209463.0, 129467.0, 76164.0, 45486.0, 28128.0, 17811.0, 11217.0, 7318.0, 4810.0, 3086.0, 2012.0, 1354.0, 864.0, 595.0, 385.0, 284.0, 177.0, 115.0, 87.0, 40.0, 49.0, 18.0, 17.0, 8.0, 10.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-68.3125, -66.11328125, -63.9140625, -61.71484375, -59.515625, -57.31640625, -55.1171875, -52.91796875, -50.71875, -48.51953125, -46.3203125, -44.12109375, -41.921875, -39.72265625, -37.5234375, -35.32421875, -33.125, -30.92578125, -28.7265625, -26.52734375, -24.328125, -22.12890625, -19.9296875, -17.73046875, -15.53125, -13.33203125, -11.1328125, -8.93359375, -6.734375, -4.53515625, -2.3359375, -0.13671875, 2.0625, 4.26171875, 6.4609375, 8.66015625, 10.859375, 13.05859375, 15.2578125, 17.45703125, 19.65625, 21.85546875, 24.0546875, 26.25390625, 28.453125, 30.65234375, 32.8515625, 35.05078125, 37.25, 39.44921875, 41.6484375, 43.84765625, 46.046875, 48.24609375, 50.4453125, 52.64453125, 54.84375, 57.04296875, 59.2421875, 61.44140625, 63.640625, 65.83984375, 68.0390625, 70.23828125, 72.4375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 7.0, 4.0, 7.0, 9.0, 14.0, 12.0, 8.0, 22.0, 14.0, 30.0, 16.0, 22.0, 23.0, 29.0, 38.0, 31.0, 32.0, 31.0, 34.0, 53.0, 34.0, 31.0, 38.0, 45.0, 44.0, 47.0, 34.0, 28.0, 34.0, 35.0, 21.0, 29.0, 20.0, 18.0, 20.0, 23.0, 12.0, 13.0, 12.0, 3.0, 4.0, 11.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-40.75, -39.6064453125, -38.462890625, -37.3193359375, -36.17578125, -35.0322265625, -33.888671875, -32.7451171875, -31.6015625, -30.4580078125, -29.314453125, -28.1708984375, -27.02734375, -25.8837890625, -24.740234375, -23.5966796875, -22.453125, -21.3095703125, -20.166015625, -19.0224609375, -17.87890625, -16.7353515625, -15.591796875, -14.4482421875, -13.3046875, -12.1611328125, -11.017578125, -9.8740234375, -8.73046875, -7.5869140625, -6.443359375, -5.2998046875, -4.15625, -3.0126953125, -1.869140625, -0.7255859375, 0.41796875, 1.5615234375, 2.705078125, 3.8486328125, 4.9921875, 6.1357421875, 7.279296875, 8.4228515625, 9.56640625, 10.7099609375, 11.853515625, 12.9970703125, 14.140625, 15.2841796875, 16.427734375, 17.5712890625, 18.71484375, 19.8583984375, 21.001953125, 22.1455078125, 23.2890625, 24.4326171875, 25.576171875, 26.7197265625, 27.86328125, 29.0068359375, 30.150390625, 31.2939453125, 32.4375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 16.0, 16.0, 28.0, 43.0, 60.0, 93.0, 125.0, 214.0, 350.0, 529.0, 885.0, 1376.0, 2100.0, 3353.0, 5444.0, 9027.0, 14645.0, 25027.0, 43067.0, 78024.0, 151282.0, 267695.0, 203671.0, 105244.0, 56137.0, 32068.0, 18766.0, 11161.0, 6688.0, 4270.0, 2675.0, 1573.0, 1054.0, 659.0, 412.0, 260.0, 208.0, 117.0, 68.0, 46.0, 26.0, 20.0, 11.0, 12.0, 1.0, 0.0, 6.0, 1.0, 0.0, 5.0, 1.0], "bins": [-83.9375, -81.5205078125, -79.103515625, -76.6865234375, -74.26953125, -71.8525390625, -69.435546875, -67.0185546875, -64.6015625, -62.1845703125, -59.767578125, -57.3505859375, -54.93359375, -52.5166015625, -50.099609375, -47.6826171875, -45.265625, -42.8486328125, -40.431640625, -38.0146484375, -35.59765625, -33.1806640625, -30.763671875, -28.3466796875, -25.9296875, -23.5126953125, -21.095703125, -18.6787109375, -16.26171875, -13.8447265625, -11.427734375, -9.0107421875, -6.59375, -4.1767578125, -1.759765625, 0.6572265625, 3.07421875, 5.4912109375, 7.908203125, 10.3251953125, 12.7421875, 15.1591796875, 17.576171875, 19.9931640625, 22.41015625, 24.8271484375, 27.244140625, 29.6611328125, 32.078125, 34.4951171875, 36.912109375, 39.3291015625, 41.74609375, 44.1630859375, 46.580078125, 48.9970703125, 51.4140625, 53.8310546875, 56.248046875, 58.6650390625, 61.08203125, 63.4990234375, 65.916015625, 68.3330078125, 70.75]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 10.0, 10.0, 13.0, 9.0, 17.0, 21.0, 17.0, 25.0, 34.0, 35.0, 39.0, 39.0, 41.0, 52.0, 38.0, 44.0, 54.0, 37.0, 54.0, 50.0, 34.0, 35.0, 34.0, 36.0, 38.0, 29.0, 23.0, 22.0, 23.0, 13.0, 13.0, 11.0, 8.0, 7.0, 5.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.90625, -27.94775390625, -26.9892578125, -26.03076171875, -25.072265625, -24.11376953125, -23.1552734375, -22.19677734375, -21.23828125, -20.27978515625, -19.3212890625, -18.36279296875, -17.404296875, -16.44580078125, -15.4873046875, -14.52880859375, -13.5703125, -12.61181640625, -11.6533203125, -10.69482421875, -9.736328125, -8.77783203125, -7.8193359375, -6.86083984375, -5.90234375, -4.94384765625, -3.9853515625, -3.02685546875, -2.068359375, -1.10986328125, -0.1513671875, 0.80712890625, 1.765625, 2.72412109375, 3.6826171875, 4.64111328125, 5.599609375, 6.55810546875, 7.5166015625, 8.47509765625, 9.43359375, 10.39208984375, 11.3505859375, 12.30908203125, 13.267578125, 14.22607421875, 15.1845703125, 16.14306640625, 17.1015625, 18.06005859375, 19.0185546875, 19.97705078125, 20.935546875, 21.89404296875, 22.8525390625, 23.81103515625, 24.76953125, 25.72802734375, 26.6865234375, 27.64501953125, 28.603515625, 29.56201171875, 30.5205078125, 31.47900390625, 32.4375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 12.0, 16.0, 12.0, 26.0, 39.0, 40.0, 57.0, 88.0, 117.0, 146.0, 230.0, 346.0, 491.0, 626.0, 1016.0, 1525.0, 2486.0, 4097.0, 7783.0, 17271.0, 48270.0, 228996.0, 603869.0, 80881.0, 25704.0, 10592.0, 5260.0, 2927.0, 1846.0, 1197.0, 778.0, 525.0, 385.0, 253.0, 171.0, 139.0, 100.0, 71.0, 48.0, 32.0, 16.0, 16.0, 13.0, 9.0, 11.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-138.875, -134.5625, -130.25, -125.9375, -121.625, -117.3125, -113.0, -108.6875, -104.375, -100.0625, -95.75, -91.4375, -87.125, -82.8125, -78.5, -74.1875, -69.875, -65.5625, -61.25, -56.9375, -52.625, -48.3125, -44.0, -39.6875, -35.375, -31.0625, -26.75, -22.4375, -18.125, -13.8125, -9.5, -5.1875, -0.875, 3.4375, 7.75, 12.0625, 16.375, 20.6875, 25.0, 29.3125, 33.625, 37.9375, 42.25, 46.5625, 50.875, 55.1875, 59.5, 63.8125, 68.125, 72.4375, 76.75, 81.0625, 85.375, 89.6875, 94.0, 98.3125, 102.625, 106.9375, 111.25, 115.5625, 119.875, 124.1875, 128.5, 132.8125, 137.125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 5.0, 8.0, 12.0, 17.0, 15.0, 39.0, 54.0, 87.0, 137.0, 191.0, 141.0, 107.0, 57.0, 29.0, 28.0, 15.0, 10.0, 6.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005390167236328125, -0.005214273929595947, -0.0050383806228637695, -0.004862487316131592, -0.004686594009399414, -0.004510700702667236, -0.004334807395935059, -0.004158914089202881, -0.003983020782470703, -0.0038071274757385254, -0.0036312341690063477, -0.00345534086227417, -0.003279447555541992, -0.0031035542488098145, -0.0029276609420776367, -0.002751767635345459, -0.0025758743286132812, -0.0023999810218811035, -0.0022240877151489258, -0.002048194408416748, -0.0018723011016845703, -0.0016964077949523926, -0.0015205144882202148, -0.0013446211814880371, -0.0011687278747558594, -0.0009928345680236816, -0.0008169412612915039, -0.0006410479545593262, -0.00046515464782714844, -0.0002892613410949707, -0.00011336803436279297, 6.252527236938477e-05, 0.0002384185791015625, 0.00041431188583374023, 0.000590205192565918, 0.0007660984992980957, 0.0009419918060302734, 0.0011178851127624512, 0.001293778419494629, 0.0014696717262268066, 0.0016455650329589844, 0.0018214583396911621, 0.00199735164642334, 0.0021732449531555176, 0.0023491382598876953, 0.002525031566619873, 0.0027009248733520508, 0.0028768181800842285, 0.0030527114868164062, 0.003228604793548584, 0.0034044981002807617, 0.0035803914070129395, 0.003756284713745117, 0.003932178020477295, 0.004108071327209473, 0.00428396463394165, 0.004459857940673828, 0.004635751247406006, 0.004811644554138184, 0.004987537860870361, 0.005163431167602539, 0.005339324474334717, 0.0055152177810668945, 0.005691111087799072, 0.00586700439453125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 9.0, 8.0, 11.0, 9.0, 19.0, 12.0, 36.0, 37.0, 68.0, 98.0, 139.0, 203.0, 342.0, 494.0, 852.0, 1629.0, 3106.0, 6991.0, 20329.0, 102576.0, 767900.0, 108487.0, 20804.0, 7096.0, 3232.0, 1615.0, 907.0, 504.0, 328.0, 213.0, 144.0, 101.0, 68.0, 48.0, 34.0, 19.0, 16.0, 15.0, 10.0, 13.0, 4.0, 10.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-198.125, -191.837890625, -185.55078125, -179.263671875, -172.9765625, -166.689453125, -160.40234375, -154.115234375, -147.828125, -141.541015625, -135.25390625, -128.966796875, -122.6796875, -116.392578125, -110.10546875, -103.818359375, -97.53125, -91.244140625, -84.95703125, -78.669921875, -72.3828125, -66.095703125, -59.80859375, -53.521484375, -47.234375, -40.947265625, -34.66015625, -28.373046875, -22.0859375, -15.798828125, -9.51171875, -3.224609375, 3.0625, 9.349609375, 15.63671875, 21.923828125, 28.2109375, 34.498046875, 40.78515625, 47.072265625, 53.359375, 59.646484375, 65.93359375, 72.220703125, 78.5078125, 84.794921875, 91.08203125, 97.369140625, 103.65625, 109.943359375, 116.23046875, 122.517578125, 128.8046875, 135.091796875, 141.37890625, 147.666015625, 153.953125, 160.240234375, 166.52734375, 172.814453125, 179.1015625, 185.388671875, 191.67578125, 197.962890625, 204.25]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 10.0, 11.0, 13.0, 11.0, 25.0, 46.0, 70.0, 120.0, 141.0, 152.0, 149.0, 66.0, 60.0, 44.0, 27.0, 14.0, 6.0, 8.0, 0.0, 5.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-60.46875, -59.068603515625, -57.66845703125, -56.268310546875, -54.8681640625, -53.468017578125, -52.06787109375, -50.667724609375, -49.267578125, -47.867431640625, -46.46728515625, -45.067138671875, -43.6669921875, -42.266845703125, -40.86669921875, -39.466552734375, -38.06640625, -36.666259765625, -35.26611328125, -33.865966796875, -32.4658203125, -31.065673828125, -29.66552734375, -28.265380859375, -26.865234375, -25.465087890625, -24.06494140625, -22.664794921875, -21.2646484375, -19.864501953125, -18.46435546875, -17.064208984375, -15.6640625, -14.263916015625, -12.86376953125, -11.463623046875, -10.0634765625, -8.663330078125, -7.26318359375, -5.863037109375, -4.462890625, -3.062744140625, -1.66259765625, -0.262451171875, 1.1376953125, 2.537841796875, 3.93798828125, 5.338134765625, 6.73828125, 8.138427734375, 9.53857421875, 10.938720703125, 12.3388671875, 13.739013671875, 15.13916015625, 16.539306640625, 17.939453125, 19.339599609375, 20.73974609375, 22.139892578125, 23.5400390625, 24.940185546875, 26.34033203125, 27.740478515625, 29.140625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 6.0, 13.0, 16.0, 17.0, 31.0, 40.0, 38.0, 47.0, 56.0, 77.0, 87.0, 95.0, 67.0, 55.0, 62.0, 43.0, 34.0, 32.0, 25.0, 22.0, 28.0, 22.0, 10.0, 9.0, 9.0, 3.0, 6.0, 13.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.24359130859375, -38.55179977416992, -36.86001205444336, -35.16822052001953, -33.4764289855957, -31.784639358520508, -30.092849731445312, -28.401058197021484, -26.709266662597656, -25.01747703552246, -23.325685501098633, -21.633895874023438, -19.94210433959961, -18.250314712524414, -16.55852508544922, -14.86673355102539, -13.174943923950195, -11.483153343200684, -9.791362762451172, -8.099573135375977, -6.407782077789307, -4.715991973876953, -3.0242013931274414, -1.3324108123779297, 0.35937976837158203, 2.0511703491210938, 3.7429606914520264, 5.434751033782959, 7.126541614532471, 8.818331718444824, 10.510122299194336, 12.201912879943848, 13.89370346069336, 15.585494041442871, 17.277284622192383, 18.969074249267578, 20.660865783691406, 22.3526554107666, 24.044445037841797, 25.736236572265625, 27.428028106689453, 29.11981773376465, 30.811609268188477, 32.50339889526367, 34.1951904296875, 35.88697814941406, 37.57876968383789, 39.27056121826172, 40.96234893798828, 42.65414047241211, 44.34592819213867, 46.0377197265625, 47.72951126098633, 49.421302795410156, 51.11309051513672, 52.80488204956055, 54.496673583984375, 56.1884651184082, 57.880252838134766, 59.572044372558594, 61.26383590698242, 62.95562744140625, 64.64741516113281, 66.33920288085938, 68.03099822998047]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 5.0, 5.0, 9.0, 9.0, 13.0, 10.0, 17.0, 19.0, 20.0, 27.0, 21.0, 25.0, 34.0, 28.0, 33.0, 36.0, 26.0, 20.0, 39.0, 37.0, 29.0, 41.0, 39.0, 34.0, 29.0, 44.0, 38.0, 32.0, 31.0, 20.0, 37.0, 30.0, 21.0, 21.0, 25.0, 11.0, 16.0, 8.0, 17.0, 10.0, 6.0, 9.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-45.97113037109375, -44.62940216064453, -43.28767395019531, -41.945945739746094, -40.604217529296875, -39.26249313354492, -37.9207649230957, -36.579036712646484, -35.237308502197266, -33.89558029174805, -32.55385208129883, -31.212125778198242, -29.870397567749023, -28.528669357299805, -27.18694305419922, -25.84521484375, -24.50348663330078, -23.161758422851562, -21.820030212402344, -20.478303909301758, -19.13657569885254, -17.79484748840332, -16.453121185302734, -15.111392974853516, -13.769664764404297, -12.427936553955078, -11.086209297180176, -9.744482040405273, -8.402753829956055, -7.061026096343994, -5.719298362731934, -4.377571105957031, -3.035846710205078, -1.6941189765930176, -0.35239124298095703, 0.9893364906311035, 2.331064224243164, 3.6727919578552246, 5.014519691467285, 6.3562469482421875, 7.697975158691406, 9.039703369140625, 10.381430625915527, 11.72315788269043, 13.064886093139648, 14.406614303588867, 15.74834156036377, 17.090068817138672, 18.43179702758789, 19.77352523803711, 21.115253448486328, 22.456979751586914, 23.798707962036133, 25.14043617248535, 26.482162475585938, 27.823890686035156, 29.165618896484375, 30.507347106933594, 31.849075317382812, 33.19080352783203, 34.53253173828125, 35.8742561340332, 37.21598434448242, 38.55771255493164, 39.89944076538086]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 11.0, 17.0, 27.0, 36.0, 44.0, 68.0, 115.0, 160.0, 261.0, 337.0, 555.0, 813.0, 1326.0, 1945.0, 3213.0, 5192.0, 8479.0, 14416.0, 24181.0, 42878.0, 79726.0, 160699.0, 483523.0, 1886383.0, 1001721.0, 244640.0, 108219.0, 55551.0, 29988.0, 16459.0, 9531.0, 5389.0, 3195.0, 2004.0, 1199.0, 713.0, 446.0, 283.0, 177.0, 116.0, 84.0, 47.0, 31.0, 30.0, 23.0, 9.0, 8.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-65.3125, -63.31591796875, -61.3193359375, -59.32275390625, -57.326171875, -55.32958984375, -53.3330078125, -51.33642578125, -49.33984375, -47.34326171875, -45.3466796875, -43.35009765625, -41.353515625, -39.35693359375, -37.3603515625, -35.36376953125, -33.3671875, -31.37060546875, -29.3740234375, -27.37744140625, -25.380859375, -23.38427734375, -21.3876953125, -19.39111328125, -17.39453125, -15.39794921875, -13.4013671875, -11.40478515625, -9.408203125, -7.41162109375, -5.4150390625, -3.41845703125, -1.421875, 0.57470703125, 2.5712890625, 4.56787109375, 6.564453125, 8.56103515625, 10.5576171875, 12.55419921875, 14.55078125, 16.54736328125, 18.5439453125, 20.54052734375, 22.537109375, 24.53369140625, 26.5302734375, 28.52685546875, 30.5234375, 32.52001953125, 34.5166015625, 36.51318359375, 38.509765625, 40.50634765625, 42.5029296875, 44.49951171875, 46.49609375, 48.49267578125, 50.4892578125, 52.48583984375, 54.482421875, 56.47900390625, 58.4755859375, 60.47216796875, 62.46875]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 4.0, 2.0, 9.0, 8.0, 8.0, 11.0, 16.0, 15.0, 21.0, 27.0, 25.0, 27.0, 28.0, 36.0, 32.0, 36.0, 38.0, 36.0, 37.0, 36.0, 34.0, 49.0, 43.0, 27.0, 40.0, 36.0, 42.0, 37.0, 36.0, 24.0, 37.0, 33.0, 19.0, 17.0, 17.0, 13.0, 8.0, 9.0, 8.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.09375, -22.319091796875, -21.54443359375, -20.769775390625, -19.9951171875, -19.220458984375, -18.44580078125, -17.671142578125, -16.896484375, -16.121826171875, -15.34716796875, -14.572509765625, -13.7978515625, -13.023193359375, -12.24853515625, -11.473876953125, -10.69921875, -9.924560546875, -9.14990234375, -8.375244140625, -7.6005859375, -6.825927734375, -6.05126953125, -5.276611328125, -4.501953125, -3.727294921875, -2.95263671875, -2.177978515625, -1.4033203125, -0.628662109375, 0.14599609375, 0.920654296875, 1.6953125, 2.469970703125, 3.24462890625, 4.019287109375, 4.7939453125, 5.568603515625, 6.34326171875, 7.117919921875, 7.892578125, 8.667236328125, 9.44189453125, 10.216552734375, 10.9912109375, 11.765869140625, 12.54052734375, 13.315185546875, 14.08984375, 14.864501953125, 15.63916015625, 16.413818359375, 17.1884765625, 17.963134765625, 18.73779296875, 19.512451171875, 20.287109375, 21.061767578125, 21.83642578125, 22.611083984375, 23.3857421875, 24.160400390625, 24.93505859375, 25.709716796875, 26.484375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 11.0, 12.0, 20.0, 28.0, 32.0, 43.0, 65.0, 78.0, 106.0, 159.0, 286.0, 359.0, 559.0, 812.0, 1138.0, 1702.0, 2513.0, 3902.0, 6045.0, 9654.0, 16334.0, 27885.0, 50074.0, 96468.0, 205157.0, 505258.0, 1647244.0, 970770.0, 333398.0, 145696.0, 72249.0, 38197.0, 21971.0, 12993.0, 8015.0, 4996.0, 3374.0, 2173.0, 1431.0, 943.0, 635.0, 461.0, 322.0, 217.0, 145.0, 96.0, 74.0, 47.0, 42.0, 32.0, 21.0, 14.0, 13.0, 6.0, 9.0, 1.0, 2.0, 1.0], "bins": [-49.0625, -47.56591796875, -46.0693359375, -44.57275390625, -43.076171875, -41.57958984375, -40.0830078125, -38.58642578125, -37.08984375, -35.59326171875, -34.0966796875, -32.60009765625, -31.103515625, -29.60693359375, -28.1103515625, -26.61376953125, -25.1171875, -23.62060546875, -22.1240234375, -20.62744140625, -19.130859375, -17.63427734375, -16.1376953125, -14.64111328125, -13.14453125, -11.64794921875, -10.1513671875, -8.65478515625, -7.158203125, -5.66162109375, -4.1650390625, -2.66845703125, -1.171875, 0.32470703125, 1.8212890625, 3.31787109375, 4.814453125, 6.31103515625, 7.8076171875, 9.30419921875, 10.80078125, 12.29736328125, 13.7939453125, 15.29052734375, 16.787109375, 18.28369140625, 19.7802734375, 21.27685546875, 22.7734375, 24.27001953125, 25.7666015625, 27.26318359375, 28.759765625, 30.25634765625, 31.7529296875, 33.24951171875, 34.74609375, 36.24267578125, 37.7392578125, 39.23583984375, 40.732421875, 42.22900390625, 43.7255859375, 45.22216796875, 46.71875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 9.0, 15.0, 12.0, 24.0, 21.0, 36.0, 49.0, 39.0, 58.0, 85.0, 93.0, 143.0, 148.0, 188.0, 263.0, 322.0, 442.0, 456.0, 382.0, 261.0, 222.0, 151.0, 140.0, 105.0, 82.0, 71.0, 49.0, 38.0, 36.0, 24.0, 17.0, 20.0, 10.0, 12.0, 11.0, 6.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.015625, -16.53369140625, -16.0517578125, -15.56982421875, -15.087890625, -14.60595703125, -14.1240234375, -13.64208984375, -13.16015625, -12.67822265625, -12.1962890625, -11.71435546875, -11.232421875, -10.75048828125, -10.2685546875, -9.78662109375, -9.3046875, -8.82275390625, -8.3408203125, -7.85888671875, -7.376953125, -6.89501953125, -6.4130859375, -5.93115234375, -5.44921875, -4.96728515625, -4.4853515625, -4.00341796875, -3.521484375, -3.03955078125, -2.5576171875, -2.07568359375, -1.59375, -1.11181640625, -0.6298828125, -0.14794921875, 0.333984375, 0.81591796875, 1.2978515625, 1.77978515625, 2.26171875, 2.74365234375, 3.2255859375, 3.70751953125, 4.189453125, 4.67138671875, 5.1533203125, 5.63525390625, 6.1171875, 6.59912109375, 7.0810546875, 7.56298828125, 8.044921875, 8.52685546875, 9.0087890625, 9.49072265625, 9.97265625, 10.45458984375, 10.9365234375, 11.41845703125, 11.900390625, 12.38232421875, 12.8642578125, 13.34619140625, 13.828125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 10.0, 3.0, 6.0, 7.0, 5.0, 11.0, 7.0, 21.0, 26.0, 44.0, 37.0, 72.0, 77.0, 87.0, 107.0, 117.0, 83.0, 79.0, 43.0, 32.0, 30.0, 15.0, 28.0, 10.0, 19.0, 6.0, 5.0, 7.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.72951126098633, -38.3490104675293, -36.968505859375, -35.58800506591797, -34.20750427246094, -32.82699966430664, -31.44649887084961, -30.065996170043945, -28.68549346923828, -27.304990768432617, -25.924489974975586, -24.543987274169922, -23.163484573364258, -21.782981872558594, -20.402481079101562, -19.0219783782959, -17.641477584838867, -16.260974884033203, -14.880473136901855, -13.499971389770508, -12.119468688964844, -10.738966941833496, -9.358465194702148, -7.977962493896484, -6.597460746765137, -5.216958522796631, -3.836456537246704, -2.4559545516967773, -1.0754523277282715, 0.3050498962402344, 1.685551643371582, 3.066054344177246, 4.446556091308594, 5.8270583152771, 7.2075605392456055, 8.588062286376953, 9.968564987182617, 11.349066734313965, 12.729568481445312, 14.110071182250977, 15.490572929382324, 16.871074676513672, 18.251577377319336, 19.632080078125, 21.01258087158203, 22.393083572387695, 23.77358627319336, 25.15408706665039, 26.534589767456055, 27.91509246826172, 29.29559326171875, 30.676095962524414, 32.05659866333008, 33.43709945678711, 34.817604064941406, 36.19810485839844, 37.57860565185547, 38.9591064453125, 40.3396110534668, 41.72011184692383, 43.10061264038086, 44.481117248535156, 45.86161804199219, 47.24211883544922, 48.622623443603516]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 7.0, 6.0, 8.0, 14.0, 14.0, 20.0, 14.0, 25.0, 24.0, 20.0, 30.0, 30.0, 32.0, 31.0, 38.0, 34.0, 21.0, 37.0, 36.0, 35.0, 27.0, 48.0, 32.0, 39.0, 51.0, 34.0, 35.0, 30.0, 32.0, 28.0, 22.0, 17.0, 22.0, 19.0, 12.0, 10.0, 12.0, 9.0, 8.0, 7.0, 2.0, 2.0, 1.0, 9.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-27.813217163085938, -27.006799697875977, -26.200380325317383, -25.393962860107422, -24.587543487548828, -23.781126022338867, -22.974708557128906, -22.168289184570312, -21.36187171936035, -20.55545425415039, -19.749034881591797, -18.942617416381836, -18.136199951171875, -17.32978057861328, -16.52336311340332, -15.716944694519043, -14.910526275634766, -14.104107856750488, -13.297689437866211, -12.49127197265625, -11.684853553771973, -10.878435134887695, -10.072017669677734, -9.265599250793457, -8.45918083190918, -7.652762413024902, -6.846344470977783, -6.039926528930664, -5.233508110046387, -4.427089691162109, -3.6206717491149902, -2.814253807067871, -2.0078353881835938, -1.2014172077178955, -0.39499902725219727, 0.411419153213501, 1.2178373336791992, 2.0242557525634766, 2.8306736946105957, 3.637091636657715, 4.443510055541992, 5.2499284744262695, 6.056346416473389, 6.862764358520508, 7.669182777404785, 8.475601196289062, 9.282018661499023, 10.0884370803833, 10.894855499267578, 11.701273918151855, 12.507692337036133, 13.314109802246094, 14.120528221130371, 14.926946640014648, 15.73336410522461, 16.539783477783203, 17.346200942993164, 18.152618408203125, 18.95903778076172, 19.76545524597168, 20.57187271118164, 21.378292083740234, 22.184709548950195, 22.991127014160156, 23.79754638671875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 12.0, 9.0, 11.0, 19.0, 31.0, 53.0, 68.0, 93.0, 146.0, 243.0, 363.0, 563.0, 931.0, 1564.0, 2555.0, 4351.0, 7477.0, 13318.0, 23163.0, 41536.0, 76784.0, 150270.0, 281182.0, 209800.0, 105971.0, 56088.0, 30553.0, 17315.0, 9906.0, 5709.0, 3316.0, 1933.0, 1201.0, 720.0, 442.0, 313.0, 173.0, 138.0, 79.0, 55.0, 31.0, 24.0, 17.0, 11.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.28125, -13.8450927734375, -13.408935546875, -12.9727783203125, -12.53662109375, -12.1004638671875, -11.664306640625, -11.2281494140625, -10.7919921875, -10.3558349609375, -9.919677734375, -9.4835205078125, -9.04736328125, -8.6112060546875, -8.175048828125, -7.7388916015625, -7.302734375, -6.8665771484375, -6.430419921875, -5.9942626953125, -5.55810546875, -5.1219482421875, -4.685791015625, -4.2496337890625, -3.8134765625, -3.3773193359375, -2.941162109375, -2.5050048828125, -2.06884765625, -1.6326904296875, -1.196533203125, -0.7603759765625, -0.32421875, 0.1119384765625, 0.548095703125, 0.9842529296875, 1.42041015625, 1.8565673828125, 2.292724609375, 2.7288818359375, 3.1650390625, 3.6011962890625, 4.037353515625, 4.4735107421875, 4.90966796875, 5.3458251953125, 5.781982421875, 6.2181396484375, 6.654296875, 7.0904541015625, 7.526611328125, 7.9627685546875, 8.39892578125, 8.8350830078125, 9.271240234375, 9.7073974609375, 10.1435546875, 10.5797119140625, 11.015869140625, 11.4520263671875, 11.88818359375, 12.3243408203125, 12.760498046875, 13.1966552734375, 13.6328125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 10.0, 6.0, 17.0, 23.0, 17.0, 19.0, 23.0, 19.0, 38.0, 36.0, 31.0, 38.0, 27.0, 35.0, 44.0, 32.0, 34.0, 40.0, 34.0, 37.0, 33.0, 35.0, 46.0, 40.0, 30.0, 27.0, 33.0, 31.0, 22.0, 18.0, 21.0, 15.0, 14.0, 12.0, 13.0, 3.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-27.0625, -26.23193359375, -25.4013671875, -24.57080078125, -23.740234375, -22.90966796875, -22.0791015625, -21.24853515625, -20.41796875, -19.58740234375, -18.7568359375, -17.92626953125, -17.095703125, -16.26513671875, -15.4345703125, -14.60400390625, -13.7734375, -12.94287109375, -12.1123046875, -11.28173828125, -10.451171875, -9.62060546875, -8.7900390625, -7.95947265625, -7.12890625, -6.29833984375, -5.4677734375, -4.63720703125, -3.806640625, -2.97607421875, -2.1455078125, -1.31494140625, -0.484375, 0.34619140625, 1.1767578125, 2.00732421875, 2.837890625, 3.66845703125, 4.4990234375, 5.32958984375, 6.16015625, 6.99072265625, 7.8212890625, 8.65185546875, 9.482421875, 10.31298828125, 11.1435546875, 11.97412109375, 12.8046875, 13.63525390625, 14.4658203125, 15.29638671875, 16.126953125, 16.95751953125, 17.7880859375, 18.61865234375, 19.44921875, 20.27978515625, 21.1103515625, 21.94091796875, 22.771484375, 23.60205078125, 24.4326171875, 25.26318359375, 26.09375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 2.0, 2.0, 9.0, 5.0, 12.0, 17.0, 16.0, 28.0, 43.0, 60.0, 88.0, 110.0, 172.0, 234.0, 345.0, 502.0, 842.0, 1181.0, 1762.0, 2967.0, 4734.0, 7684.0, 13482.0, 23575.0, 42968.0, 83068.0, 176097.0, 333529.0, 173427.0, 81819.0, 42455.0, 23513.0, 13137.0, 7642.0, 4587.0, 2955.0, 1884.0, 1217.0, 742.0, 542.0, 340.0, 239.0, 137.0, 114.0, 84.0, 58.0, 30.0, 33.0, 24.0, 12.0, 11.0, 9.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.6484375, -10.2991943359375, -9.949951171875, -9.6007080078125, -9.25146484375, -8.9022216796875, -8.552978515625, -8.2037353515625, -7.8544921875, -7.5052490234375, -7.156005859375, -6.8067626953125, -6.45751953125, -6.1082763671875, -5.759033203125, -5.4097900390625, -5.060546875, -4.7113037109375, -4.362060546875, -4.0128173828125, -3.66357421875, -3.3143310546875, -2.965087890625, -2.6158447265625, -2.2666015625, -1.9173583984375, -1.568115234375, -1.2188720703125, -0.86962890625, -0.5203857421875, -0.171142578125, 0.1781005859375, 0.52734375, 0.8765869140625, 1.225830078125, 1.5750732421875, 1.92431640625, 2.2735595703125, 2.622802734375, 2.9720458984375, 3.3212890625, 3.6705322265625, 4.019775390625, 4.3690185546875, 4.71826171875, 5.0675048828125, 5.416748046875, 5.7659912109375, 6.115234375, 6.4644775390625, 6.813720703125, 7.1629638671875, 7.51220703125, 7.8614501953125, 8.210693359375, 8.5599365234375, 8.9091796875, 9.2584228515625, 9.607666015625, 9.9569091796875, 10.30615234375, 10.6553955078125, 11.004638671875, 11.3538818359375, 11.703125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 14.0, 11.0, 18.0, 20.0, 22.0, 14.0, 21.0, 29.0, 36.0, 30.0, 30.0, 34.0, 37.0, 44.0, 27.0, 47.0, 46.0, 48.0, 30.0, 53.0, 38.0, 37.0, 37.0, 27.0, 27.0, 25.0, 35.0, 29.0, 14.0, 15.0, 20.0, 7.0, 9.0, 10.0, 12.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.28125, -18.698486328125, -18.11572265625, -17.532958984375, -16.9501953125, -16.367431640625, -15.78466796875, -15.201904296875, -14.619140625, -14.036376953125, -13.45361328125, -12.870849609375, -12.2880859375, -11.705322265625, -11.12255859375, -10.539794921875, -9.95703125, -9.374267578125, -8.79150390625, -8.208740234375, -7.6259765625, -7.043212890625, -6.46044921875, -5.877685546875, -5.294921875, -4.712158203125, -4.12939453125, -3.546630859375, -2.9638671875, -2.381103515625, -1.79833984375, -1.215576171875, -0.6328125, -0.050048828125, 0.53271484375, 1.115478515625, 1.6982421875, 2.281005859375, 2.86376953125, 3.446533203125, 4.029296875, 4.612060546875, 5.19482421875, 5.777587890625, 6.3603515625, 6.943115234375, 7.52587890625, 8.108642578125, 8.69140625, 9.274169921875, 9.85693359375, 10.439697265625, 11.0224609375, 11.605224609375, 12.18798828125, 12.770751953125, 13.353515625, 13.936279296875, 14.51904296875, 15.101806640625, 15.6845703125, 16.267333984375, 16.85009765625, 17.432861328125, 18.015625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 12.0, 14.0, 24.0, 29.0, 30.0, 49.0, 74.0, 105.0, 144.0, 191.0, 283.0, 428.0, 644.0, 913.0, 1421.0, 2297.0, 3591.0, 6219.0, 11226.0, 22271.0, 49630.0, 147354.0, 576735.0, 131339.0, 46304.0, 20787.0, 10562.0, 5959.0, 3522.0, 2169.0, 1373.0, 905.0, 618.0, 389.0, 256.0, 190.0, 163.0, 97.0, 63.0, 46.0, 25.0, 23.0, 22.0, 18.0, 12.0, 5.0, 6.0, 5.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.390625, -4.2415771484375, -4.092529296875, -3.9434814453125, -3.79443359375, -3.6453857421875, -3.496337890625, -3.3472900390625, -3.1982421875, -3.0491943359375, -2.900146484375, -2.7510986328125, -2.60205078125, -2.4530029296875, -2.303955078125, -2.1549072265625, -2.005859375, -1.8568115234375, -1.707763671875, -1.5587158203125, -1.40966796875, -1.2606201171875, -1.111572265625, -0.9625244140625, -0.8134765625, -0.6644287109375, -0.515380859375, -0.3663330078125, -0.21728515625, -0.0682373046875, 0.080810546875, 0.2298583984375, 0.37890625, 0.5279541015625, 0.677001953125, 0.8260498046875, 0.97509765625, 1.1241455078125, 1.273193359375, 1.4222412109375, 1.5712890625, 1.7203369140625, 1.869384765625, 2.0184326171875, 2.16748046875, 2.3165283203125, 2.465576171875, 2.6146240234375, 2.763671875, 2.9127197265625, 3.061767578125, 3.2108154296875, 3.35986328125, 3.5089111328125, 3.657958984375, 3.8070068359375, 3.9560546875, 4.1051025390625, 4.254150390625, 4.4031982421875, 4.55224609375, 4.7012939453125, 4.850341796875, 4.9993896484375, 5.1484375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 7.0, 7.0, 8.0, 22.0, 18.0, 35.0, 40.0, 37.0, 52.0, 87.0, 88.0, 111.0, 89.0, 82.0, 72.0, 68.0, 50.0, 32.0, 22.0, 13.0, 14.0, 5.0, 9.0, 12.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000576019287109375, -0.000557340681552887, -0.0005386620759963989, -0.0005199834704399109, -0.0005013048648834229, -0.0004826262593269348, -0.0004639476537704468, -0.00044526904821395874, -0.0004265904426574707, -0.00040791183710098267, -0.00038923323154449463, -0.0003705546259880066, -0.00035187602043151855, -0.0003331974148750305, -0.0003145188093185425, -0.00029584020376205444, -0.0002771615982055664, -0.00025848299264907837, -0.00023980438709259033, -0.0002211257815361023, -0.00020244717597961426, -0.00018376857042312622, -0.00016508996486663818, -0.00014641135931015015, -0.0001277327537536621, -0.00010905414819717407, -9.037554264068604e-05, -7.1696937084198e-05, -5.301833152770996e-05, -3.4339725971221924e-05, -1.5661120414733887e-05, 3.0174851417541504e-06, 2.1696090698242188e-05, 4.0374696254730225e-05, 5.905330181121826e-05, 7.77319073677063e-05, 9.641051292419434e-05, 0.00011508911848068237, 0.0001337677240371704, 0.00015244632959365845, 0.00017112493515014648, 0.00018980354070663452, 0.00020848214626312256, 0.0002271607518196106, 0.00024583935737609863, 0.00026451796293258667, 0.0002831965684890747, 0.00030187517404556274, 0.0003205537796020508, 0.0003392323851585388, 0.00035791099071502686, 0.0003765895962715149, 0.00039526820182800293, 0.00041394680738449097, 0.000432625412940979, 0.00045130401849746704, 0.0004699826240539551, 0.0004886612296104431, 0.0005073398351669312, 0.0005260184407234192, 0.0005446970462799072, 0.0005633756518363953, 0.0005820542573928833, 0.0006007328629493713, 0.0006194114685058594]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 0.0, 9.0, 4.0, 5.0, 6.0, 12.0, 15.0, 40.0, 47.0, 64.0, 112.0, 139.0, 231.0, 296.0, 383.0, 575.0, 811.0, 1209.0, 1696.0, 2538.0, 3682.0, 5353.0, 8551.0, 12949.0, 20335.0, 32305.0, 54107.0, 93954.0, 294493.0, 277888.0, 92934.0, 53220.0, 32107.0, 20135.0, 12827.0, 8295.0, 5425.0, 3663.0, 2498.0, 1677.0, 1263.0, 810.0, 569.0, 399.0, 276.0, 201.0, 155.0, 111.0, 63.0, 49.0, 31.0, 16.0, 12.0, 9.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-12.1953125, -11.8140869140625, -11.432861328125, -11.0516357421875, -10.67041015625, -10.2891845703125, -9.907958984375, -9.5267333984375, -9.1455078125, -8.7642822265625, -8.383056640625, -8.0018310546875, -7.62060546875, -7.2393798828125, -6.858154296875, -6.4769287109375, -6.095703125, -5.7144775390625, -5.333251953125, -4.9520263671875, -4.57080078125, -4.1895751953125, -3.808349609375, -3.4271240234375, -3.0458984375, -2.6646728515625, -2.283447265625, -1.9022216796875, -1.52099609375, -1.1397705078125, -0.758544921875, -0.3773193359375, 0.00390625, 0.3851318359375, 0.766357421875, 1.1475830078125, 1.52880859375, 1.9100341796875, 2.291259765625, 2.6724853515625, 3.0537109375, 3.4349365234375, 3.816162109375, 4.1973876953125, 4.57861328125, 4.9598388671875, 5.341064453125, 5.7222900390625, 6.103515625, 6.4847412109375, 6.865966796875, 7.2471923828125, 7.62841796875, 8.0096435546875, 8.390869140625, 8.7720947265625, 9.1533203125, 9.5345458984375, 9.915771484375, 10.2969970703125, 10.67822265625, 11.0594482421875, 11.440673828125, 11.8218994140625, 12.203125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 2.0, 4.0, 8.0, 8.0, 16.0, 17.0, 21.0, 15.0, 25.0, 24.0, 16.0, 30.0, 29.0, 32.0, 25.0, 22.0, 24.0, 33.0, 59.0, 59.0, 102.0, 48.0, 27.0, 28.0, 34.0, 29.0, 38.0, 37.0, 28.0, 19.0, 18.0, 20.0, 13.0, 13.0, 13.0, 14.0, 6.0, 8.0, 8.0, 6.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9765625, -2.865478515625, -2.75439453125, -2.643310546875, -2.5322265625, -2.421142578125, -2.31005859375, -2.198974609375, -2.087890625, -1.976806640625, -1.86572265625, -1.754638671875, -1.6435546875, -1.532470703125, -1.42138671875, -1.310302734375, -1.19921875, -1.088134765625, -0.97705078125, -0.865966796875, -0.7548828125, -0.643798828125, -0.53271484375, -0.421630859375, -0.310546875, -0.199462890625, -0.08837890625, 0.022705078125, 0.1337890625, 0.244873046875, 0.35595703125, 0.467041015625, 0.578125, 0.689208984375, 0.80029296875, 0.911376953125, 1.0224609375, 1.133544921875, 1.24462890625, 1.355712890625, 1.466796875, 1.577880859375, 1.68896484375, 1.800048828125, 1.9111328125, 2.022216796875, 2.13330078125, 2.244384765625, 2.35546875, 2.466552734375, 2.57763671875, 2.688720703125, 2.7998046875, 2.910888671875, 3.02197265625, 3.133056640625, 3.244140625, 3.355224609375, 3.46630859375, 3.577392578125, 3.6884765625, 3.799560546875, 3.91064453125, 4.021728515625, 4.1328125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 4.0, 9.0, 4.0, 4.0, 7.0, 13.0, 15.0, 22.0, 29.0, 42.0, 55.0, 72.0, 85.0, 123.0, 108.0, 98.0, 74.0, 55.0, 33.0, 33.0, 27.0, 23.0, 19.0, 17.0, 6.0, 9.0, 5.0, 6.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.61536407470703, -46.085025787353516, -44.5546875, -43.024349212646484, -41.49401092529297, -39.96366882324219, -38.43333053588867, -36.902992248535156, -35.37265396118164, -33.842315673828125, -32.31197738647461, -30.78163719177246, -29.251298904418945, -27.72096061706543, -26.19062042236328, -24.660282135009766, -23.12994384765625, -21.599605560302734, -20.06926727294922, -18.53892707824707, -17.008588790893555, -15.478250503540039, -13.947911262512207, -12.417572021484375, -10.88723373413086, -9.356895446777344, -7.826556205749512, -6.296217441558838, -4.765878677368164, -3.2355399131774902, -1.7052011489868164, -0.17486190795898438, 1.3554725646972656, 2.8858113288879395, 4.416150093078613, 5.946488857269287, 7.476827621459961, 9.007165908813477, 10.537505149841309, 12.06784439086914, 13.598182678222656, 15.128520965576172, 16.658859252929688, 18.189199447631836, 19.71953773498535, 21.249876022338867, 22.780216217041016, 24.31055450439453, 25.840892791748047, 27.371231079101562, 28.901569366455078, 30.431909561157227, 31.962247848510742, 33.49258804321289, 35.022926330566406, 36.55326461791992, 38.08360290527344, 39.61394119262695, 41.14427947998047, 42.674617767333984, 44.2049560546875, 45.73529815673828, 47.2656364440918, 48.79597473144531, 50.32631301879883]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 6.0, 5.0, 5.0, 12.0, 11.0, 12.0, 20.0, 20.0, 23.0, 22.0, 33.0, 34.0, 27.0, 31.0, 29.0, 33.0, 38.0, 33.0, 30.0, 35.0, 30.0, 36.0, 36.0, 31.0, 25.0, 41.0, 33.0, 39.0, 38.0, 21.0, 33.0, 21.0, 32.0, 26.0, 16.0, 8.0, 11.0, 11.0, 10.0, 6.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.345109939575195, -28.46778678894043, -27.590463638305664, -26.7131404876709, -25.835817337036133, -24.958492279052734, -24.08116912841797, -23.203845977783203, -22.326522827148438, -21.449199676513672, -20.571876525878906, -19.69455337524414, -18.817230224609375, -17.93990707397461, -17.062583923339844, -16.185258865356445, -15.307936668395996, -14.43061351776123, -13.553290367126465, -12.675966262817383, -11.798643112182617, -10.921319961547852, -10.043996810913086, -9.16667366027832, -8.289350509643555, -7.412027359008789, -6.534703731536865, -5.6573805809021, -4.780056953430176, -3.90273380279541, -3.0254106521606445, -2.1480870246887207, -1.2707633972167969, -0.3934400677680969, 0.483883261680603, 1.3612065315246582, 2.238529920578003, 3.1158533096313477, 3.9931764602661133, 4.870500087738037, 5.747823238372803, 6.625146389007568, 7.502470016479492, 8.379793167114258, 9.257116317749023, 10.134439468383789, 11.011762619018555, 11.889086723327637, 12.766409873962402, 13.643733024597168, 14.521056175231934, 15.398380279541016, 16.27570343017578, 17.153026580810547, 18.030349731445312, 18.907672882080078, 19.784996032714844, 20.66231918334961, 21.539642333984375, 22.41696548461914, 23.294288635253906, 24.171611785888672, 25.048934936523438, 25.926259994506836, 26.8035831451416]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 6.0, 1.0, 7.0, 6.0, 15.0, 15.0, 27.0, 27.0, 36.0, 67.0, 57.0, 85.0, 133.0, 199.0, 330.0, 437.0, 681.0, 1118.0, 1804.0, 3034.0, 5208.0, 8790.0, 15562.0, 27337.0, 48217.0, 85189.0, 149811.0, 234514.0, 198809.0, 114645.0, 65109.0, 36989.0, 21038.0, 11822.0, 6703.0, 4112.0, 2394.0, 1472.0, 901.0, 592.0, 394.0, 242.0, 189.0, 116.0, 98.0, 60.0, 47.0, 32.0, 27.0, 21.0, 16.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.75, -49.15234375, -47.5546875, -45.95703125, -44.359375, -42.76171875, -41.1640625, -39.56640625, -37.96875, -36.37109375, -34.7734375, -33.17578125, -31.578125, -29.98046875, -28.3828125, -26.78515625, -25.1875, -23.58984375, -21.9921875, -20.39453125, -18.796875, -17.19921875, -15.6015625, -14.00390625, -12.40625, -10.80859375, -9.2109375, -7.61328125, -6.015625, -4.41796875, -2.8203125, -1.22265625, 0.375, 1.97265625, 3.5703125, 5.16796875, 6.765625, 8.36328125, 9.9609375, 11.55859375, 13.15625, 14.75390625, 16.3515625, 17.94921875, 19.546875, 21.14453125, 22.7421875, 24.33984375, 25.9375, 27.53515625, 29.1328125, 30.73046875, 32.328125, 33.92578125, 35.5234375, 37.12109375, 38.71875, 40.31640625, 41.9140625, 43.51171875, 45.109375, 46.70703125, 48.3046875, 49.90234375, 51.5]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 5.0, 2.0, 4.0, 7.0, 4.0, 2.0, 8.0, 5.0, 7.0, 9.0, 8.0, 14.0, 15.0, 19.0, 25.0, 27.0, 23.0, 25.0, 34.0, 37.0, 28.0, 28.0, 36.0, 33.0, 33.0, 29.0, 34.0, 31.0, 33.0, 33.0, 39.0, 38.0, 23.0, 26.0, 33.0, 43.0, 31.0, 27.0, 20.0, 28.0, 20.0, 18.0, 17.0, 13.0, 6.0, 2.0, 8.0, 2.0, 4.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-24.0625, -23.3291015625, -22.595703125, -21.8623046875, -21.12890625, -20.3955078125, -19.662109375, -18.9287109375, -18.1953125, -17.4619140625, -16.728515625, -15.9951171875, -15.26171875, -14.5283203125, -13.794921875, -13.0615234375, -12.328125, -11.5947265625, -10.861328125, -10.1279296875, -9.39453125, -8.6611328125, -7.927734375, -7.1943359375, -6.4609375, -5.7275390625, -4.994140625, -4.2607421875, -3.52734375, -2.7939453125, -2.060546875, -1.3271484375, -0.59375, 0.1396484375, 0.873046875, 1.6064453125, 2.33984375, 3.0732421875, 3.806640625, 4.5400390625, 5.2734375, 6.0068359375, 6.740234375, 7.4736328125, 8.20703125, 8.9404296875, 9.673828125, 10.4072265625, 11.140625, 11.8740234375, 12.607421875, 13.3408203125, 14.07421875, 14.8076171875, 15.541015625, 16.2744140625, 17.0078125, 17.7412109375, 18.474609375, 19.2080078125, 19.94140625, 20.6748046875, 21.408203125, 22.1416015625, 22.875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 1.0, 7.0, 12.0, 13.0, 17.0, 20.0, 26.0, 52.0, 64.0, 134.0, 144.0, 246.0, 370.0, 510.0, 762.0, 1184.0, 1718.0, 2613.0, 3839.0, 5835.0, 8809.0, 13352.0, 20299.0, 32917.0, 52752.0, 88961.0, 152308.0, 225226.0, 171863.0, 101291.0, 59943.0, 36479.0, 23054.0, 14639.0, 9661.0, 6331.0, 4296.0, 2841.0, 1929.0, 1354.0, 877.0, 530.0, 408.0, 288.0, 188.0, 104.0, 90.0, 55.0, 37.0, 31.0, 29.0, 12.0, 7.0, 16.0, 5.0, 9.0, 1.0, 0.0, 4.0, 4.0], "bins": [-41.78125, -40.4599609375, -39.138671875, -37.8173828125, -36.49609375, -35.1748046875, -33.853515625, -32.5322265625, -31.2109375, -29.8896484375, -28.568359375, -27.2470703125, -25.92578125, -24.6044921875, -23.283203125, -21.9619140625, -20.640625, -19.3193359375, -17.998046875, -16.6767578125, -15.35546875, -14.0341796875, -12.712890625, -11.3916015625, -10.0703125, -8.7490234375, -7.427734375, -6.1064453125, -4.78515625, -3.4638671875, -2.142578125, -0.8212890625, 0.5, 1.8212890625, 3.142578125, 4.4638671875, 5.78515625, 7.1064453125, 8.427734375, 9.7490234375, 11.0703125, 12.3916015625, 13.712890625, 15.0341796875, 16.35546875, 17.6767578125, 18.998046875, 20.3193359375, 21.640625, 22.9619140625, 24.283203125, 25.6044921875, 26.92578125, 28.2470703125, 29.568359375, 30.8896484375, 32.2109375, 33.5322265625, 34.853515625, 36.1748046875, 37.49609375, 38.8173828125, 40.138671875, 41.4599609375, 42.78125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 9.0, 6.0, 6.0, 9.0, 26.0, 10.0, 25.0, 9.0, 27.0, 27.0, 28.0, 30.0, 30.0, 44.0, 45.0, 55.0, 54.0, 50.0, 40.0, 43.0, 55.0, 60.0, 43.0, 36.0, 31.0, 28.0, 27.0, 31.0, 23.0, 19.0, 17.0, 11.0, 13.0, 9.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.14501953125, -20.4306640625, -19.71630859375, -19.001953125, -18.28759765625, -17.5732421875, -16.85888671875, -16.14453125, -15.43017578125, -14.7158203125, -14.00146484375, -13.287109375, -12.57275390625, -11.8583984375, -11.14404296875, -10.4296875, -9.71533203125, -9.0009765625, -8.28662109375, -7.572265625, -6.85791015625, -6.1435546875, -5.42919921875, -4.71484375, -4.00048828125, -3.2861328125, -2.57177734375, -1.857421875, -1.14306640625, -0.4287109375, 0.28564453125, 1.0, 1.71435546875, 2.4287109375, 3.14306640625, 3.857421875, 4.57177734375, 5.2861328125, 6.00048828125, 6.71484375, 7.42919921875, 8.1435546875, 8.85791015625, 9.572265625, 10.28662109375, 11.0009765625, 11.71533203125, 12.4296875, 13.14404296875, 13.8583984375, 14.57275390625, 15.287109375, 16.00146484375, 16.7158203125, 17.43017578125, 18.14453125, 18.85888671875, 19.5732421875, 20.28759765625, 21.001953125, 21.71630859375, 22.4306640625, 23.14501953125, 23.859375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 11.0, 13.0, 24.0, 26.0, 35.0, 48.0, 63.0, 107.0, 144.0, 205.0, 273.0, 372.0, 549.0, 780.0, 1352.0, 2274.0, 4277.0, 9009.0, 26317.0, 129538.0, 741502.0, 92568.0, 21686.0, 7857.0, 3725.0, 2022.0, 1247.0, 786.0, 487.0, 356.0, 246.0, 174.0, 136.0, 85.0, 89.0, 48.0, 38.0, 21.0, 16.0, 13.0, 10.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.9375, -113.0927734375, -109.248046875, -105.4033203125, -101.55859375, -97.7138671875, -93.869140625, -90.0244140625, -86.1796875, -82.3349609375, -78.490234375, -74.6455078125, -70.80078125, -66.9560546875, -63.111328125, -59.2666015625, -55.421875, -51.5771484375, -47.732421875, -43.8876953125, -40.04296875, -36.1982421875, -32.353515625, -28.5087890625, -24.6640625, -20.8193359375, -16.974609375, -13.1298828125, -9.28515625, -5.4404296875, -1.595703125, 2.2490234375, 6.09375, 9.9384765625, 13.783203125, 17.6279296875, 21.47265625, 25.3173828125, 29.162109375, 33.0068359375, 36.8515625, 40.6962890625, 44.541015625, 48.3857421875, 52.23046875, 56.0751953125, 59.919921875, 63.7646484375, 67.609375, 71.4541015625, 75.298828125, 79.1435546875, 82.98828125, 86.8330078125, 90.677734375, 94.5224609375, 98.3671875, 102.2119140625, 106.056640625, 109.9013671875, 113.74609375, 117.5908203125, 121.435546875, 125.2802734375, 129.125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 11.0, 18.0, 24.0, 60.0, 142.0, 321.0, 206.0, 87.0, 51.0, 24.0, 16.0, 11.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004058837890625, -0.0038633346557617188, -0.0036678314208984375, -0.0034723281860351562, -0.003276824951171875, -0.0030813217163085938, -0.0028858184814453125, -0.0026903152465820312, -0.00249481201171875, -0.0022993087768554688, -0.0021038055419921875, -0.0019083023071289062, -0.001712799072265625, -0.0015172958374023438, -0.0013217926025390625, -0.0011262893676757812, -0.0009307861328125, -0.0007352828979492188, -0.0005397796630859375, -0.00034427642822265625, -0.000148773193359375, 4.673004150390625e-05, 0.0002422332763671875, 0.00043773651123046875, 0.00063323974609375, 0.0008287429809570312, 0.0010242462158203125, 0.0012197494506835938, 0.001415252685546875, 0.0016107559204101562, 0.0018062591552734375, 0.0020017623901367188, 0.002197265625, 0.0023927688598632812, 0.0025882720947265625, 0.0027837753295898438, 0.002979278564453125, 0.0031747817993164062, 0.0033702850341796875, 0.0035657882690429688, 0.00376129150390625, 0.003956794738769531, 0.0041522979736328125, 0.004347801208496094, 0.004543304443359375, 0.004738807678222656, 0.0049343109130859375, 0.005129814147949219, 0.0053253173828125, 0.005520820617675781, 0.0057163238525390625, 0.005911827087402344, 0.006107330322265625, 0.006302833557128906, 0.0064983367919921875, 0.006693840026855469, 0.00688934326171875, 0.007084846496582031, 0.0072803497314453125, 0.007475852966308594, 0.007671356201171875, 0.007866859436035156, 0.008062362670898438, 0.008257865905761719, 0.008453369140625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 3.0, 9.0, 18.0, 18.0, 13.0, 23.0, 24.0, 39.0, 52.0, 97.0, 106.0, 160.0, 217.0, 316.0, 478.0, 738.0, 1060.0, 1619.0, 2693.0, 4776.0, 9442.0, 23353.0, 81659.0, 683750.0, 172886.0, 36340.0, 13254.0, 6104.0, 3341.0, 1989.0, 1271.0, 833.0, 541.0, 413.0, 244.0, 200.0, 130.0, 89.0, 75.0, 62.0, 23.0, 30.0, 13.0, 16.0, 11.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-96.5625, -93.3115234375, -90.060546875, -86.8095703125, -83.55859375, -80.3076171875, -77.056640625, -73.8056640625, -70.5546875, -67.3037109375, -64.052734375, -60.8017578125, -57.55078125, -54.2998046875, -51.048828125, -47.7978515625, -44.546875, -41.2958984375, -38.044921875, -34.7939453125, -31.54296875, -28.2919921875, -25.041015625, -21.7900390625, -18.5390625, -15.2880859375, -12.037109375, -8.7861328125, -5.53515625, -2.2841796875, 0.966796875, 4.2177734375, 7.46875, 10.7197265625, 13.970703125, 17.2216796875, 20.47265625, 23.7236328125, 26.974609375, 30.2255859375, 33.4765625, 36.7275390625, 39.978515625, 43.2294921875, 46.48046875, 49.7314453125, 52.982421875, 56.2333984375, 59.484375, 62.7353515625, 65.986328125, 69.2373046875, 72.48828125, 75.7392578125, 78.990234375, 82.2412109375, 85.4921875, 88.7431640625, 91.994140625, 95.2451171875, 98.49609375, 101.7470703125, 104.998046875, 108.2490234375, 111.5]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 4.0, 4.0, 6.0, 3.0, 16.0, 15.0, 29.0, 33.0, 62.0, 91.0, 154.0, 209.0, 126.0, 82.0, 53.0, 34.0, 21.0, 17.0, 7.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.84375, -33.88623046875, -32.9287109375, -31.97119140625, -31.013671875, -30.05615234375, -29.0986328125, -28.14111328125, -27.18359375, -26.22607421875, -25.2685546875, -24.31103515625, -23.353515625, -22.39599609375, -21.4384765625, -20.48095703125, -19.5234375, -18.56591796875, -17.6083984375, -16.65087890625, -15.693359375, -14.73583984375, -13.7783203125, -12.82080078125, -11.86328125, -10.90576171875, -9.9482421875, -8.99072265625, -8.033203125, -7.07568359375, -6.1181640625, -5.16064453125, -4.203125, -3.24560546875, -2.2880859375, -1.33056640625, -0.373046875, 0.58447265625, 1.5419921875, 2.49951171875, 3.45703125, 4.41455078125, 5.3720703125, 6.32958984375, 7.287109375, 8.24462890625, 9.2021484375, 10.15966796875, 11.1171875, 12.07470703125, 13.0322265625, 13.98974609375, 14.947265625, 15.90478515625, 16.8623046875, 17.81982421875, 18.77734375, 19.73486328125, 20.6923828125, 21.64990234375, 22.607421875, 23.56494140625, 24.5224609375, 25.47998046875, 26.4375]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 12.0, 25.0, 19.0, 27.0, 49.0, 76.0, 113.0, 143.0, 133.0, 98.0, 63.0, 46.0, 38.0, 34.0, 30.0, 17.0, 20.0, 7.0, 12.0, 7.0, 9.0, 3.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.62872314453125, -49.985801696777344, -48.34288024902344, -46.699954986572266, -45.05703353881836, -43.41411209106445, -41.77118682861328, -40.128265380859375, -38.48534393310547, -36.84242248535156, -35.199501037597656, -33.556575775146484, -31.913654327392578, -30.270732879638672, -28.627809524536133, -26.984886169433594, -25.341964721679688, -23.69904327392578, -22.056119918823242, -20.413196563720703, -18.770275115966797, -17.12735366821289, -15.484430313110352, -13.841507911682129, -12.198585510253906, -10.555663108825684, -8.912740707397461, -7.269818305969238, -5.626895904541016, -3.983973503112793, -2.3410511016845703, -0.6981287002563477, 0.944793701171875, 2.5877161026000977, 4.23063850402832, 5.873560905456543, 7.516483306884766, 9.159405708312988, 10.802328109741211, 12.445250511169434, 14.088172912597656, 15.731095314025879, 17.3740177154541, 19.01694107055664, 20.659862518310547, 22.302783966064453, 23.945707321166992, 25.58863067626953, 27.231552124023438, 28.874473571777344, 30.517396926879883, 32.16032028198242, 33.80324172973633, 35.446163177490234, 37.089088439941406, 38.73200988769531, 40.37493133544922, 42.017852783203125, 43.66077423095703, 45.3036994934082, 46.94662094116211, 48.589542388916016, 50.23246765136719, 51.875389099121094, 53.518310546875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 5.0, 12.0, 4.0, 8.0, 12.0, 4.0, 12.0, 8.0, 16.0, 22.0, 28.0, 23.0, 26.0, 26.0, 39.0, 38.0, 39.0, 42.0, 41.0, 49.0, 42.0, 44.0, 45.0, 40.0, 31.0, 44.0, 34.0, 47.0, 32.0, 32.0, 34.0, 24.0, 23.0, 21.0, 12.0, 8.0, 14.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.08091735839844, -34.04567337036133, -33.01042938232422, -31.97518539428711, -30.939943313598633, -29.904699325561523, -28.869455337524414, -27.834211349487305, -26.798969268798828, -25.76372528076172, -24.72848129272461, -23.6932373046875, -22.657995223999023, -21.622751235961914, -20.587507247924805, -19.552263259887695, -18.517019271850586, -17.481775283813477, -16.446531295776367, -15.411288261413574, -14.376045227050781, -13.340801239013672, -12.305557250976562, -11.270313262939453, -10.23507022857666, -9.19982624053955, -8.164583206176758, -7.129339218139648, -6.094095706939697, -5.058852195739746, -4.023608207702637, -2.9883646965026855, -1.9531192779541016, -0.9178756475448608, 0.11736798286437988, 1.1526117324829102, 2.1878552436828613, 3.2230987548828125, 4.258342742919922, 5.293586254119873, 6.328829765319824, 7.364073276519775, 8.399316787719727, 9.434560775756836, 10.469804763793945, 11.505047798156738, 12.540291786193848, 13.57553482055664, 14.61077880859375, 15.64602279663086, 16.68126678466797, 17.716510772705078, 18.751752853393555, 19.786996841430664, 20.822240829467773, 21.857484817504883, 22.89272689819336, 23.92797088623047, 24.963214874267578, 25.998458862304688, 27.033700942993164, 28.068944931030273, 29.104188919067383, 30.139432907104492, 31.1746768951416]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 10.0, 12.0, 8.0, 41.0, 55.0, 63.0, 118.0, 175.0, 235.0, 381.0, 513.0, 715.0, 1030.0, 1535.0, 2185.0, 3281.0, 5033.0, 7678.0, 11632.0, 18628.0, 31070.0, 54697.0, 103316.0, 226228.0, 870371.0, 1886872.0, 568216.0, 191273.0, 90923.0, 48047.0, 27195.0, 15955.0, 9831.0, 6098.0, 3762.0, 2493.0, 1594.0, 1063.0, 638.0, 415.0, 287.0, 190.0, 104.0, 93.0, 60.0, 47.0, 33.0, 22.0, 20.0, 19.0, 8.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.96875, -34.70068359375, -33.4326171875, -32.16455078125, -30.896484375, -29.62841796875, -28.3603515625, -27.09228515625, -25.82421875, -24.55615234375, -23.2880859375, -22.02001953125, -20.751953125, -19.48388671875, -18.2158203125, -16.94775390625, -15.6796875, -14.41162109375, -13.1435546875, -11.87548828125, -10.607421875, -9.33935546875, -8.0712890625, -6.80322265625, -5.53515625, -4.26708984375, -2.9990234375, -1.73095703125, -0.462890625, 0.80517578125, 2.0732421875, 3.34130859375, 4.609375, 5.87744140625, 7.1455078125, 8.41357421875, 9.681640625, 10.94970703125, 12.2177734375, 13.48583984375, 14.75390625, 16.02197265625, 17.2900390625, 18.55810546875, 19.826171875, 21.09423828125, 22.3623046875, 23.63037109375, 24.8984375, 26.16650390625, 27.4345703125, 28.70263671875, 29.970703125, 31.23876953125, 32.5068359375, 33.77490234375, 35.04296875, 36.31103515625, 37.5791015625, 38.84716796875, 40.115234375, 41.38330078125, 42.6513671875, 43.91943359375, 45.1875]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 1.0, 7.0, 4.0, 2.0, 8.0, 11.0, 15.0, 16.0, 12.0, 26.0, 17.0, 26.0, 45.0, 34.0, 34.0, 40.0, 44.0, 38.0, 43.0, 42.0, 60.0, 47.0, 59.0, 39.0, 49.0, 38.0, 28.0, 36.0, 41.0, 29.0, 23.0, 22.0, 11.0, 14.0, 15.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.8125, -20.220458984375, -19.62841796875, -19.036376953125, -18.4443359375, -17.852294921875, -17.26025390625, -16.668212890625, -16.076171875, -15.484130859375, -14.89208984375, -14.300048828125, -13.7080078125, -13.115966796875, -12.52392578125, -11.931884765625, -11.33984375, -10.747802734375, -10.15576171875, -9.563720703125, -8.9716796875, -8.379638671875, -7.78759765625, -7.195556640625, -6.603515625, -6.011474609375, -5.41943359375, -4.827392578125, -4.2353515625, -3.643310546875, -3.05126953125, -2.459228515625, -1.8671875, -1.275146484375, -0.68310546875, -0.091064453125, 0.5009765625, 1.093017578125, 1.68505859375, 2.277099609375, 2.869140625, 3.461181640625, 4.05322265625, 4.645263671875, 5.2373046875, 5.829345703125, 6.42138671875, 7.013427734375, 7.60546875, 8.197509765625, 8.78955078125, 9.381591796875, 9.9736328125, 10.565673828125, 11.15771484375, 11.749755859375, 12.341796875, 12.933837890625, 13.52587890625, 14.117919921875, 14.7099609375, 15.302001953125, 15.89404296875, 16.486083984375, 17.078125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 10.0, 11.0, 23.0, 36.0, 42.0, 57.0, 124.0, 138.0, 291.0, 447.0, 835.0, 1465.0, 2757.0, 5284.0, 10215.0, 22541.0, 51915.0, 139892.0, 486318.0, 2320255.0, 821413.0, 203035.0, 70770.0, 29126.0, 13275.0, 6374.0, 3455.0, 1750.0, 1001.0, 579.0, 304.0, 215.0, 110.0, 75.0, 48.0, 34.0, 13.0, 12.0, 7.0, 13.0, 1.0, 5.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.40625, -45.80810546875, -44.2099609375, -42.61181640625, -41.013671875, -39.41552734375, -37.8173828125, -36.21923828125, -34.62109375, -33.02294921875, -31.4248046875, -29.82666015625, -28.228515625, -26.63037109375, -25.0322265625, -23.43408203125, -21.8359375, -20.23779296875, -18.6396484375, -17.04150390625, -15.443359375, -13.84521484375, -12.2470703125, -10.64892578125, -9.05078125, -7.45263671875, -5.8544921875, -4.25634765625, -2.658203125, -1.06005859375, 0.5380859375, 2.13623046875, 3.734375, 5.33251953125, 6.9306640625, 8.52880859375, 10.126953125, 11.72509765625, 13.3232421875, 14.92138671875, 16.51953125, 18.11767578125, 19.7158203125, 21.31396484375, 22.912109375, 24.51025390625, 26.1083984375, 27.70654296875, 29.3046875, 30.90283203125, 32.5009765625, 34.09912109375, 35.697265625, 37.29541015625, 38.8935546875, 40.49169921875, 42.08984375, 43.68798828125, 45.2861328125, 46.88427734375, 48.482421875, 50.08056640625, 51.6787109375, 53.27685546875, 54.875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 10.0, 5.0, 8.0, 19.0, 17.0, 10.0, 26.0, 44.0, 45.0, 69.0, 81.0, 140.0, 181.0, 198.0, 278.0, 358.0, 503.0, 544.0, 375.0, 295.0, 202.0, 184.0, 140.0, 92.0, 76.0, 39.0, 45.0, 32.0, 18.0, 19.0, 8.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.765625, -15.363525390625, -14.96142578125, -14.559326171875, -14.1572265625, -13.755126953125, -13.35302734375, -12.950927734375, -12.548828125, -12.146728515625, -11.74462890625, -11.342529296875, -10.9404296875, -10.538330078125, -10.13623046875, -9.734130859375, -9.33203125, -8.929931640625, -8.52783203125, -8.125732421875, -7.7236328125, -7.321533203125, -6.91943359375, -6.517333984375, -6.115234375, -5.713134765625, -5.31103515625, -4.908935546875, -4.5068359375, -4.104736328125, -3.70263671875, -3.300537109375, -2.8984375, -2.496337890625, -2.09423828125, -1.692138671875, -1.2900390625, -0.887939453125, -0.48583984375, -0.083740234375, 0.318359375, 0.720458984375, 1.12255859375, 1.524658203125, 1.9267578125, 2.328857421875, 2.73095703125, 3.133056640625, 3.53515625, 3.937255859375, 4.33935546875, 4.741455078125, 5.1435546875, 5.545654296875, 5.94775390625, 6.349853515625, 6.751953125, 7.154052734375, 7.55615234375, 7.958251953125, 8.3603515625, 8.762451171875, 9.16455078125, 9.566650390625, 9.96875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 3.0, 8.0, 4.0, 14.0, 14.0, 12.0, 26.0, 39.0, 48.0, 72.0, 75.0, 97.0, 118.0, 106.0, 77.0, 59.0, 39.0, 43.0, 28.0, 16.0, 19.0, 12.0, 9.0, 7.0, 8.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.38177490234375, -30.500268936157227, -29.618762969970703, -28.73725700378418, -27.855751037597656, -26.974246978759766, -26.092741012573242, -25.21123504638672, -24.329729080200195, -23.448223114013672, -22.56671714782715, -21.685211181640625, -20.803707122802734, -19.922199249267578, -19.040695190429688, -18.159189224243164, -17.27768325805664, -16.396177291870117, -15.514671325683594, -14.633166313171387, -13.751660346984863, -12.87015438079834, -11.988649368286133, -11.10714340209961, -10.225637435913086, -9.344131469726562, -8.462625503540039, -7.581120491027832, -6.699614524841309, -5.818108558654785, -4.93660306930542, -4.055097579956055, -3.1735897064208984, -2.292083978652954, -1.4105782508850098, -0.5290725231170654, 0.3524332046508789, 1.2339391708374023, 2.1154446601867676, 2.996950149536133, 3.8784561157226562, 4.75996208190918, 5.641467571258545, 6.52297306060791, 7.404479026794434, 8.285984992980957, 9.167490005493164, 10.048995971679688, 10.930501937866211, 11.812007904052734, 12.693513870239258, 13.575018882751465, 14.456524848937988, 15.338030815124512, 16.21953582763672, 17.101041793823242, 17.982547760009766, 18.86405372619629, 19.745559692382812, 20.627065658569336, 21.50857162475586, 22.39007568359375, 23.271581649780273, 24.153087615966797, 25.03459358215332]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 7.0, 5.0, 14.0, 11.0, 8.0, 13.0, 13.0, 21.0, 22.0, 22.0, 30.0, 29.0, 30.0, 30.0, 37.0, 44.0, 41.0, 54.0, 46.0, 56.0, 36.0, 47.0, 41.0, 42.0, 37.0, 34.0, 35.0, 34.0, 34.0, 35.0, 23.0, 14.0, 10.0, 12.0, 10.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.622703552246094, -23.956533432006836, -23.29036521911621, -22.624195098876953, -21.958024978637695, -21.291854858398438, -20.625686645507812, -19.959516525268555, -19.293346405029297, -18.62717628479004, -17.961008071899414, -17.294837951660156, -16.6286678314209, -15.962498664855957, -15.296329498291016, -14.630159378051758, -13.963991165161133, -13.297821998596191, -12.631651878356934, -11.965482711791992, -11.299312591552734, -10.633143424987793, -9.966974258422852, -9.300804138183594, -8.634634971618652, -7.968465328216553, -7.302295684814453, -6.636126518249512, -5.969956874847412, -5.3037872314453125, -4.637618064880371, -3.9714484214782715, -3.305276870727539, -2.6391072273254395, -1.972937822341919, -1.3067682981491089, -0.6405987739562988, 0.02557086944580078, 0.6917402744293213, 1.3579096794128418, 2.0240793228149414, 2.690248966217041, 3.3564183712005615, 4.022587776184082, 4.688757419586182, 5.354927062988281, 6.021096229553223, 6.687265872955322, 7.353435516357422, 8.019604682922363, 8.685774803161621, 9.351943969726562, 10.01811408996582, 10.684283256530762, 11.350452423095703, 12.016622543334961, 12.682791709899902, 13.348960876464844, 14.015130996704102, 14.681300163269043, 15.347469329833984, 16.013639450073242, 16.6798095703125, 17.345977783203125, 18.012147903442383]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 9.0, 17.0, 14.0, 26.0, 36.0, 65.0, 62.0, 84.0, 130.0, 161.0, 259.0, 373.0, 539.0, 851.0, 1279.0, 1879.0, 2887.0, 4530.0, 7029.0, 11770.0, 19844.0, 34558.0, 64097.0, 127711.0, 290197.0, 240883.0, 107520.0, 55196.0, 30306.0, 17599.0, 10336.0, 6491.0, 3978.0, 2639.0, 1635.0, 1108.0, 787.0, 526.0, 355.0, 239.0, 168.0, 117.0, 82.0, 61.0, 35.0, 23.0, 22.0, 14.0, 12.0, 8.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0], "bins": [-9.453125, -9.1656494140625, -8.878173828125, -8.5906982421875, -8.30322265625, -8.0157470703125, -7.728271484375, -7.4407958984375, -7.1533203125, -6.8658447265625, -6.578369140625, -6.2908935546875, -6.00341796875, -5.7159423828125, -5.428466796875, -5.1409912109375, -4.853515625, -4.5660400390625, -4.278564453125, -3.9910888671875, -3.70361328125, -3.4161376953125, -3.128662109375, -2.8411865234375, -2.5537109375, -2.2662353515625, -1.978759765625, -1.6912841796875, -1.40380859375, -1.1163330078125, -0.828857421875, -0.5413818359375, -0.25390625, 0.0335693359375, 0.321044921875, 0.6085205078125, 0.89599609375, 1.1834716796875, 1.470947265625, 1.7584228515625, 2.0458984375, 2.3333740234375, 2.620849609375, 2.9083251953125, 3.19580078125, 3.4832763671875, 3.770751953125, 4.0582275390625, 4.345703125, 4.6331787109375, 4.920654296875, 5.2081298828125, 5.49560546875, 5.7830810546875, 6.070556640625, 6.3580322265625, 6.6455078125, 6.9329833984375, 7.220458984375, 7.5079345703125, 7.79541015625, 8.0828857421875, 8.370361328125, 8.6578369140625, 8.9453125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 8.0, 5.0, 8.0, 9.0, 12.0, 18.0, 19.0, 15.0, 29.0, 32.0, 26.0, 35.0, 37.0, 35.0, 43.0, 41.0, 57.0, 55.0, 44.0, 42.0, 44.0, 41.0, 39.0, 35.0, 53.0, 34.0, 40.0, 30.0, 29.0, 20.0, 16.0, 15.0, 5.0, 5.0, 5.0, 6.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.875, -25.177490234375, -24.47998046875, -23.782470703125, -23.0849609375, -22.387451171875, -21.68994140625, -20.992431640625, -20.294921875, -19.597412109375, -18.89990234375, -18.202392578125, -17.5048828125, -16.807373046875, -16.10986328125, -15.412353515625, -14.71484375, -14.017333984375, -13.31982421875, -12.622314453125, -11.9248046875, -11.227294921875, -10.52978515625, -9.832275390625, -9.134765625, -8.437255859375, -7.73974609375, -7.042236328125, -6.3447265625, -5.647216796875, -4.94970703125, -4.252197265625, -3.5546875, -2.857177734375, -2.15966796875, -1.462158203125, -0.7646484375, -0.067138671875, 0.63037109375, 1.327880859375, 2.025390625, 2.722900390625, 3.42041015625, 4.117919921875, 4.8154296875, 5.512939453125, 6.21044921875, 6.907958984375, 7.60546875, 8.302978515625, 9.00048828125, 9.697998046875, 10.3955078125, 11.093017578125, 11.79052734375, 12.488037109375, 13.185546875, 13.883056640625, 14.58056640625, 15.278076171875, 15.9755859375, 16.673095703125, 17.37060546875, 18.068115234375, 18.765625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 7.0, 4.0, 6.0, 12.0, 16.0, 25.0, 35.0, 51.0, 75.0, 114.0, 149.0, 217.0, 321.0, 444.0, 600.0, 935.0, 1223.0, 1923.0, 2944.0, 4515.0, 7382.0, 12525.0, 22767.0, 43040.0, 92726.0, 242886.0, 361401.0, 126724.0, 56570.0, 28696.0, 15598.0, 8769.0, 5488.0, 3494.0, 2181.0, 1442.0, 935.0, 691.0, 480.0, 287.0, 239.0, 160.0, 126.0, 82.0, 70.0, 48.0, 39.0, 18.0, 25.0, 12.0, 11.0, 14.0, 11.0, 2.0, 6.0, 0.0, 2.0, 3.0], "bins": [-10.3046875, -9.9844970703125, -9.664306640625, -9.3441162109375, -9.02392578125, -8.7037353515625, -8.383544921875, -8.0633544921875, -7.7431640625, -7.4229736328125, -7.102783203125, -6.7825927734375, -6.46240234375, -6.1422119140625, -5.822021484375, -5.5018310546875, -5.181640625, -4.8614501953125, -4.541259765625, -4.2210693359375, -3.90087890625, -3.5806884765625, -3.260498046875, -2.9403076171875, -2.6201171875, -2.2999267578125, -1.979736328125, -1.6595458984375, -1.33935546875, -1.0191650390625, -0.698974609375, -0.3787841796875, -0.05859375, 0.2615966796875, 0.581787109375, 0.9019775390625, 1.22216796875, 1.5423583984375, 1.862548828125, 2.1827392578125, 2.5029296875, 2.8231201171875, 3.143310546875, 3.4635009765625, 3.78369140625, 4.1038818359375, 4.424072265625, 4.7442626953125, 5.064453125, 5.3846435546875, 5.704833984375, 6.0250244140625, 6.34521484375, 6.6654052734375, 6.985595703125, 7.3057861328125, 7.6259765625, 7.9461669921875, 8.266357421875, 8.5865478515625, 8.90673828125, 9.2269287109375, 9.547119140625, 9.8673095703125, 10.1875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 5.0, 6.0, 9.0, 10.0, 10.0, 8.0, 21.0, 16.0, 18.0, 24.0, 29.0, 27.0, 31.0, 35.0, 35.0, 28.0, 35.0, 39.0, 33.0, 43.0, 48.0, 60.0, 40.0, 44.0, 38.0, 43.0, 39.0, 30.0, 20.0, 23.0, 28.0, 23.0, 25.0, 10.0, 11.0, 10.0, 8.0, 13.0, 8.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-15.1015625, -14.6854248046875, -14.269287109375, -13.8531494140625, -13.43701171875, -13.0208740234375, -12.604736328125, -12.1885986328125, -11.7724609375, -11.3563232421875, -10.940185546875, -10.5240478515625, -10.10791015625, -9.6917724609375, -9.275634765625, -8.8594970703125, -8.443359375, -8.0272216796875, -7.611083984375, -7.1949462890625, -6.77880859375, -6.3626708984375, -5.946533203125, -5.5303955078125, -5.1142578125, -4.6981201171875, -4.281982421875, -3.8658447265625, -3.44970703125, -3.0335693359375, -2.617431640625, -2.2012939453125, -1.78515625, -1.3690185546875, -0.952880859375, -0.5367431640625, -0.12060546875, 0.2955322265625, 0.711669921875, 1.1278076171875, 1.5439453125, 1.9600830078125, 2.376220703125, 2.7923583984375, 3.20849609375, 3.6246337890625, 4.040771484375, 4.4569091796875, 4.873046875, 5.2891845703125, 5.705322265625, 6.1214599609375, 6.53759765625, 6.9537353515625, 7.369873046875, 7.7860107421875, 8.2021484375, 8.6182861328125, 9.034423828125, 9.4505615234375, 9.86669921875, 10.2828369140625, 10.698974609375, 11.1151123046875, 11.53125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 6.0, 3.0, 8.0, 10.0, 13.0, 25.0, 27.0, 33.0, 47.0, 57.0, 79.0, 102.0, 151.0, 247.0, 343.0, 493.0, 625.0, 895.0, 1324.0, 1974.0, 2931.0, 4480.0, 7181.0, 11689.0, 20372.0, 37700.0, 79511.0, 226072.0, 422752.0, 114411.0, 49928.0, 25538.0, 14611.0, 8491.0, 5533.0, 3541.0, 2172.0, 1495.0, 1098.0, 747.0, 504.0, 369.0, 279.0, 188.0, 148.0, 100.0, 79.0, 56.0, 43.0, 21.0, 19.0, 11.0, 12.0, 6.0, 4.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.20703125, -2.13629150390625, -2.0655517578125, -1.99481201171875, -1.924072265625, -1.85333251953125, -1.7825927734375, -1.71185302734375, -1.64111328125, -1.57037353515625, -1.4996337890625, -1.42889404296875, -1.358154296875, -1.28741455078125, -1.2166748046875, -1.14593505859375, -1.0751953125, -1.00445556640625, -0.9337158203125, -0.86297607421875, -0.792236328125, -0.72149658203125, -0.6507568359375, -0.58001708984375, -0.50927734375, -0.43853759765625, -0.3677978515625, -0.29705810546875, -0.226318359375, -0.15557861328125, -0.0848388671875, -0.01409912109375, 0.056640625, 0.12738037109375, 0.1981201171875, 0.26885986328125, 0.339599609375, 0.41033935546875, 0.4810791015625, 0.55181884765625, 0.62255859375, 0.69329833984375, 0.7640380859375, 0.83477783203125, 0.905517578125, 0.97625732421875, 1.0469970703125, 1.11773681640625, 1.1884765625, 1.25921630859375, 1.3299560546875, 1.40069580078125, 1.471435546875, 1.54217529296875, 1.6129150390625, 1.68365478515625, 1.75439453125, 1.82513427734375, 1.8958740234375, 1.96661376953125, 2.037353515625, 2.10809326171875, 2.1788330078125, 2.24957275390625, 2.3203125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 7.0, 5.0, 8.0, 10.0, 14.0, 18.0, 19.0, 23.0, 31.0, 43.0, 75.0, 94.0, 112.0, 133.0, 93.0, 86.0, 63.0, 47.0, 24.0, 24.0, 15.0, 17.0, 14.0, 11.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003299713134765625, -0.00032063573598861694, -0.0003113001585006714, -0.00030196458101272583, -0.0002926290035247803, -0.0002832934260368347, -0.00027395784854888916, -0.0002646222710609436, -0.00025528669357299805, -0.0002459511160850525, -0.00023661553859710693, -0.00022727996110916138, -0.00021794438362121582, -0.00020860880613327026, -0.0001992732286453247, -0.00018993765115737915, -0.0001806020736694336, -0.00017126649618148804, -0.00016193091869354248, -0.00015259534120559692, -0.00014325976371765137, -0.0001339241862297058, -0.00012458860874176025, -0.0001152530312538147, -0.00010591745376586914, -9.658187627792358e-05, -8.724629878997803e-05, -7.791072130203247e-05, -6.857514381408691e-05, -5.923956632614136e-05, -4.99039888381958e-05, -4.0568411350250244e-05, -3.123283386230469e-05, -2.189725637435913e-05, -1.2561678886413574e-05, -3.2261013984680176e-06, 6.109476089477539e-06, 1.5445053577423096e-05, 2.4780631065368652e-05, 3.411620855331421e-05, 4.3451786041259766e-05, 5.278736352920532e-05, 6.212294101715088e-05, 7.145851850509644e-05, 8.079409599304199e-05, 9.012967348098755e-05, 9.94652509689331e-05, 0.00010880082845687866, 0.00011813640594482422, 0.00012747198343276978, 0.00013680756092071533, 0.0001461431384086609, 0.00015547871589660645, 0.000164814293384552, 0.00017414987087249756, 0.00018348544836044312, 0.00019282102584838867, 0.00020215660333633423, 0.00021149218082427979, 0.00022082775831222534, 0.0002301633358001709, 0.00023949891328811646, 0.000248834490776062, 0.00025817006826400757, 0.0002675056457519531]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 11.0, 11.0, 21.0, 15.0, 28.0, 40.0, 60.0, 91.0, 131.0, 201.0, 305.0, 442.0, 697.0, 1169.0, 1794.0, 2745.0, 4402.0, 6929.0, 10678.0, 16945.0, 27299.0, 44807.0, 77984.0, 157932.0, 374432.0, 138053.0, 71173.0, 41159.0, 25308.0, 15875.0, 10154.0, 6368.0, 4028.0, 2547.0, 1626.0, 1054.0, 694.0, 448.0, 306.0, 190.0, 118.0, 91.0, 59.0, 44.0, 28.0, 22.0, 11.0, 7.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0], "bins": [-8.1328125, -7.89654541015625, -7.6602783203125, -7.42401123046875, -7.187744140625, -6.95147705078125, -6.7152099609375, -6.47894287109375, -6.24267578125, -6.00640869140625, -5.7701416015625, -5.53387451171875, -5.297607421875, -5.06134033203125, -4.8250732421875, -4.58880615234375, -4.3525390625, -4.11627197265625, -3.8800048828125, -3.64373779296875, -3.407470703125, -3.17120361328125, -2.9349365234375, -2.69866943359375, -2.46240234375, -2.22613525390625, -1.9898681640625, -1.75360107421875, -1.517333984375, -1.28106689453125, -1.0447998046875, -0.80853271484375, -0.572265625, -0.33599853515625, -0.0997314453125, 0.13653564453125, 0.372802734375, 0.60906982421875, 0.8453369140625, 1.08160400390625, 1.31787109375, 1.55413818359375, 1.7904052734375, 2.02667236328125, 2.262939453125, 2.49920654296875, 2.7354736328125, 2.97174072265625, 3.2080078125, 3.44427490234375, 3.6805419921875, 3.91680908203125, 4.153076171875, 4.38934326171875, 4.6256103515625, 4.86187744140625, 5.09814453125, 5.33441162109375, 5.5706787109375, 5.80694580078125, 6.043212890625, 6.27947998046875, 6.5157470703125, 6.75201416015625, 6.98828125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 6.0, 14.0, 14.0, 16.0, 22.0, 21.0, 16.0, 26.0, 24.0, 25.0, 36.0, 23.0, 31.0, 23.0, 42.0, 36.0, 37.0, 33.0, 45.0, 58.0, 40.0, 53.0, 32.0, 27.0, 34.0, 22.0, 18.0, 25.0, 20.0, 32.0, 17.0, 27.0, 19.0, 23.0, 20.0, 6.0, 12.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.767578125, -1.7047119140625, -1.641845703125, -1.5789794921875, -1.51611328125, -1.4532470703125, -1.390380859375, -1.3275146484375, -1.2646484375, -1.2017822265625, -1.138916015625, -1.0760498046875, -1.01318359375, -0.9503173828125, -0.887451171875, -0.8245849609375, -0.76171875, -0.6988525390625, -0.635986328125, -0.5731201171875, -0.51025390625, -0.4473876953125, -0.384521484375, -0.3216552734375, -0.2587890625, -0.1959228515625, -0.133056640625, -0.0701904296875, -0.00732421875, 0.0555419921875, 0.118408203125, 0.1812744140625, 0.244140625, 0.3070068359375, 0.369873046875, 0.4327392578125, 0.49560546875, 0.5584716796875, 0.621337890625, 0.6842041015625, 0.7470703125, 0.8099365234375, 0.872802734375, 0.9356689453125, 0.99853515625, 1.0614013671875, 1.124267578125, 1.1871337890625, 1.25, 1.3128662109375, 1.375732421875, 1.4385986328125, 1.50146484375, 1.5643310546875, 1.627197265625, 1.6900634765625, 1.7529296875, 1.8157958984375, 1.878662109375, 1.9415283203125, 2.00439453125, 2.0672607421875, 2.130126953125, 2.1929931640625, 2.255859375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 2.0, 4.0, 11.0, 14.0, 10.0, 15.0, 38.0, 38.0, 46.0, 79.0, 101.0, 117.0, 123.0, 77.0, 75.0, 47.0, 42.0, 36.0, 21.0, 12.0, 18.0, 14.0, 8.0, 4.0, 6.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.491065979003906, -32.5022087097168, -31.513349533081055, -30.524490356445312, -29.535633087158203, -28.54677391052246, -27.55791473388672, -26.56905746459961, -25.5802001953125, -24.591341018676758, -23.60248374938965, -22.613624572753906, -21.624767303466797, -20.635908126831055, -19.647048950195312, -18.658191680908203, -17.66933250427246, -16.68047332763672, -15.69161605834961, -14.702756881713867, -13.713899612426758, -12.725040435791016, -11.73618221282959, -10.747323989868164, -9.758465766906738, -8.769607543945312, -7.780749320983887, -6.791890621185303, -5.803032398223877, -4.814174175262451, -3.825315475463867, -2.8364572525024414, -1.8476009368896484, -0.8587425947189331, 0.13011574745178223, 1.118974208831787, 2.107832431793213, 3.0966906547546387, 4.085549354553223, 5.074407577514648, 6.063265800476074, 7.0521240234375, 8.040982246398926, 9.029840469360352, 10.018699645996094, 11.007556915283203, 11.996416091918945, 12.985274314880371, 13.974132537841797, 14.962990760803223, 15.951848983764648, 16.94070816040039, 17.9295654296875, 18.918424606323242, 19.907283782958984, 20.896141052246094, 21.884998321533203, 22.873857498168945, 23.862714767456055, 24.851573944091797, 25.840431213378906, 26.82929039001465, 27.81814956665039, 28.8070068359375, 29.795866012573242]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 8.0, 6.0, 8.0, 15.0, 12.0, 11.0, 9.0, 11.0, 30.0, 25.0, 24.0, 32.0, 27.0, 31.0, 25.0, 46.0, 42.0, 53.0, 40.0, 52.0, 42.0, 46.0, 42.0, 48.0, 39.0, 27.0, 26.0, 35.0, 36.0, 28.0, 41.0, 15.0, 17.0, 7.0, 13.0, 12.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.615386962890625, -24.897350311279297, -24.17931365966797, -23.46127700805664, -22.743242263793945, -22.025205612182617, -21.30716896057129, -20.58913230895996, -19.871095657348633, -19.153059005737305, -18.435022354125977, -17.71698760986328, -16.998950958251953, -16.280914306640625, -15.562877655029297, -14.844841003417969, -14.126805305480957, -13.408768653869629, -12.690732955932617, -11.972696304321289, -11.254659652709961, -10.536623001098633, -9.818587303161621, -9.100550651550293, -8.382514953613281, -7.664478778839111, -6.946442127227783, -6.228405952453613, -5.510369300842285, -4.792333126068115, -4.074296951293945, -3.356260299682617, -2.638223648071289, -1.92018723487854, -1.2021509408950806, -0.4841146469116211, 0.23392176628112793, 0.951958179473877, 1.6699943542480469, 2.388031005859375, 3.106067180633545, 3.824103593826294, 4.542140007019043, 5.260176181793213, 5.978212356567383, 6.696249008178711, 7.414285182952881, 8.132322311401367, 8.850358009338379, 9.568394660949707, 10.286430358886719, 11.004467010498047, 11.722503662109375, 12.440540313720703, 13.158576011657715, 13.876612663269043, 14.594648361206055, 15.312685012817383, 16.03072166442871, 16.748756408691406, 17.466793060302734, 18.184829711914062, 18.90286636352539, 19.62090301513672, 20.338939666748047]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 7.0, 8.0, 21.0, 23.0, 27.0, 47.0, 78.0, 102.0, 180.0, 268.0, 418.0, 616.0, 868.0, 1376.0, 2069.0, 3254.0, 4731.0, 7357.0, 11182.0, 17534.0, 27545.0, 44595.0, 73360.0, 123567.0, 200699.0, 203515.0, 125905.0, 74364.0, 45723.0, 28347.0, 17858.0, 11401.0, 7425.0, 4814.0, 3268.0, 2028.0, 1277.0, 918.0, 625.0, 384.0, 258.0, 171.0, 120.0, 77.0, 56.0, 30.0, 25.0, 12.0, 12.0, 7.0, 4.0, 6.0, 2.0, 1.0, 1.0], "bins": [-30.15625, -29.269775390625, -28.38330078125, -27.496826171875, -26.6103515625, -25.723876953125, -24.83740234375, -23.950927734375, -23.064453125, -22.177978515625, -21.29150390625, -20.405029296875, -19.5185546875, -18.632080078125, -17.74560546875, -16.859130859375, -15.97265625, -15.086181640625, -14.19970703125, -13.313232421875, -12.4267578125, -11.540283203125, -10.65380859375, -9.767333984375, -8.880859375, -7.994384765625, -7.10791015625, -6.221435546875, -5.3349609375, -4.448486328125, -3.56201171875, -2.675537109375, -1.7890625, -0.902587890625, -0.01611328125, 0.870361328125, 1.7568359375, 2.643310546875, 3.52978515625, 4.416259765625, 5.302734375, 6.189208984375, 7.07568359375, 7.962158203125, 8.8486328125, 9.735107421875, 10.62158203125, 11.508056640625, 12.39453125, 13.281005859375, 14.16748046875, 15.053955078125, 15.9404296875, 16.826904296875, 17.71337890625, 18.599853515625, 19.486328125, 20.372802734375, 21.25927734375, 22.145751953125, 23.0322265625, 23.918701171875, 24.80517578125, 25.691650390625, 26.578125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 10.0, 5.0, 12.0, 10.0, 9.0, 16.0, 29.0, 15.0, 17.0, 35.0, 27.0, 28.0, 38.0, 38.0, 38.0, 38.0, 55.0, 43.0, 45.0, 39.0, 39.0, 51.0, 39.0, 40.0, 29.0, 35.0, 29.0, 33.0, 27.0, 24.0, 19.0, 16.0, 14.0, 10.0, 7.0, 6.0, 7.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.25, -18.614013671875, -17.97802734375, -17.342041015625, -16.7060546875, -16.070068359375, -15.43408203125, -14.798095703125, -14.162109375, -13.526123046875, -12.89013671875, -12.254150390625, -11.6181640625, -10.982177734375, -10.34619140625, -9.710205078125, -9.07421875, -8.438232421875, -7.80224609375, -7.166259765625, -6.5302734375, -5.894287109375, -5.25830078125, -4.622314453125, -3.986328125, -3.350341796875, -2.71435546875, -2.078369140625, -1.4423828125, -0.806396484375, -0.17041015625, 0.465576171875, 1.1015625, 1.737548828125, 2.37353515625, 3.009521484375, 3.6455078125, 4.281494140625, 4.91748046875, 5.553466796875, 6.189453125, 6.825439453125, 7.46142578125, 8.097412109375, 8.7333984375, 9.369384765625, 10.00537109375, 10.641357421875, 11.27734375, 11.913330078125, 12.54931640625, 13.185302734375, 13.8212890625, 14.457275390625, 15.09326171875, 15.729248046875, 16.365234375, 17.001220703125, 17.63720703125, 18.273193359375, 18.9091796875, 19.545166015625, 20.18115234375, 20.817138671875, 21.453125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 14.0, 24.0, 26.0, 32.0, 50.0, 99.0, 163.0, 301.0, 457.0, 839.0, 1252.0, 2072.0, 3624.0, 6412.0, 11664.0, 21832.0, 40930.0, 81340.0, 170113.0, 312668.0, 199055.0, 93434.0, 47470.0, 24241.0, 13251.0, 7341.0, 4023.0, 2301.0, 1331.0, 876.0, 492.0, 333.0, 190.0, 133.0, 59.0, 35.0, 22.0, 12.0, 15.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0], "bins": [-46.25, -44.986328125, -43.72265625, -42.458984375, -41.1953125, -39.931640625, -38.66796875, -37.404296875, -36.140625, -34.876953125, -33.61328125, -32.349609375, -31.0859375, -29.822265625, -28.55859375, -27.294921875, -26.03125, -24.767578125, -23.50390625, -22.240234375, -20.9765625, -19.712890625, -18.44921875, -17.185546875, -15.921875, -14.658203125, -13.39453125, -12.130859375, -10.8671875, -9.603515625, -8.33984375, -7.076171875, -5.8125, -4.548828125, -3.28515625, -2.021484375, -0.7578125, 0.505859375, 1.76953125, 3.033203125, 4.296875, 5.560546875, 6.82421875, 8.087890625, 9.3515625, 10.615234375, 11.87890625, 13.142578125, 14.40625, 15.669921875, 16.93359375, 18.197265625, 19.4609375, 20.724609375, 21.98828125, 23.251953125, 24.515625, 25.779296875, 27.04296875, 28.306640625, 29.5703125, 30.833984375, 32.09765625, 33.361328125, 34.625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 11.0, 4.0, 9.0, 16.0, 14.0, 13.0, 17.0, 23.0, 27.0, 31.0, 30.0, 30.0, 39.0, 41.0, 46.0, 32.0, 38.0, 35.0, 47.0, 53.0, 49.0, 43.0, 48.0, 46.0, 40.0, 20.0, 30.0, 22.0, 20.0, 26.0, 16.0, 14.0, 9.0, 12.0, 5.0, 6.0, 11.0, 3.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-16.484375, -16.020263671875, -15.55615234375, -15.092041015625, -14.6279296875, -14.163818359375, -13.69970703125, -13.235595703125, -12.771484375, -12.307373046875, -11.84326171875, -11.379150390625, -10.9150390625, -10.450927734375, -9.98681640625, -9.522705078125, -9.05859375, -8.594482421875, -8.13037109375, -7.666259765625, -7.2021484375, -6.738037109375, -6.27392578125, -5.809814453125, -5.345703125, -4.881591796875, -4.41748046875, -3.953369140625, -3.4892578125, -3.025146484375, -2.56103515625, -2.096923828125, -1.6328125, -1.168701171875, -0.70458984375, -0.240478515625, 0.2236328125, 0.687744140625, 1.15185546875, 1.615966796875, 2.080078125, 2.544189453125, 3.00830078125, 3.472412109375, 3.9365234375, 4.400634765625, 4.86474609375, 5.328857421875, 5.79296875, 6.257080078125, 6.72119140625, 7.185302734375, 7.6494140625, 8.113525390625, 8.57763671875, 9.041748046875, 9.505859375, 9.969970703125, 10.43408203125, 10.898193359375, 11.3623046875, 11.826416015625, 12.29052734375, 12.754638671875, 13.21875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 10.0, 13.0, 17.0, 20.0, 30.0, 30.0, 56.0, 85.0, 117.0, 189.0, 267.0, 442.0, 751.0, 1284.0, 2161.0, 4229.0, 8540.0, 23062.0, 98492.0, 724031.0, 135787.0, 28383.0, 9836.0, 4569.0, 2504.0, 1429.0, 806.0, 506.0, 322.0, 175.0, 122.0, 74.0, 68.0, 40.0, 34.0, 16.0, 22.0, 7.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.0625, -78.2265625, -75.390625, -72.5546875, -69.71875, -66.8828125, -64.046875, -61.2109375, -58.375, -55.5390625, -52.703125, -49.8671875, -47.03125, -44.1953125, -41.359375, -38.5234375, -35.6875, -32.8515625, -30.015625, -27.1796875, -24.34375, -21.5078125, -18.671875, -15.8359375, -13.0, -10.1640625, -7.328125, -4.4921875, -1.65625, 1.1796875, 4.015625, 6.8515625, 9.6875, 12.5234375, 15.359375, 18.1953125, 21.03125, 23.8671875, 26.703125, 29.5390625, 32.375, 35.2109375, 38.046875, 40.8828125, 43.71875, 46.5546875, 49.390625, 52.2265625, 55.0625, 57.8984375, 60.734375, 63.5703125, 66.40625, 69.2421875, 72.078125, 74.9140625, 77.75, 80.5859375, 83.421875, 86.2578125, 89.09375, 91.9296875, 94.765625, 97.6015625, 100.4375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 7.0, 5.0, 9.0, 13.0, 7.0, 19.0, 31.0, 38.0, 81.0, 165.0, 203.0, 151.0, 90.0, 59.0, 29.0, 29.0, 13.0, 12.0, 10.0, 5.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00360870361328125, -0.0035097599029541016, -0.003410816192626953, -0.0033118724822998047, -0.0032129287719726562, -0.003113985061645508, -0.0030150413513183594, -0.002916097640991211, -0.0028171539306640625, -0.002718210220336914, -0.0026192665100097656, -0.002520322799682617, -0.0024213790893554688, -0.0023224353790283203, -0.002223491668701172, -0.0021245479583740234, -0.002025604248046875, -0.0019266605377197266, -0.0018277168273925781, -0.0017287731170654297, -0.0016298294067382812, -0.0015308856964111328, -0.0014319419860839844, -0.001332998275756836, -0.0012340545654296875, -0.001135110855102539, -0.0010361671447753906, -0.0009372234344482422, -0.0008382797241210938, -0.0007393360137939453, -0.0006403923034667969, -0.0005414485931396484, -0.0004425048828125, -0.00034356117248535156, -0.0002446174621582031, -0.0001456737518310547, -4.673004150390625e-05, 5.221366882324219e-05, 0.00015115737915039062, 0.00025010108947753906, 0.0003490447998046875, 0.00044798851013183594, 0.0005469322204589844, 0.0006458759307861328, 0.0007448196411132812, 0.0008437633514404297, 0.0009427070617675781, 0.0010416507720947266, 0.001140594482421875, 0.0012395381927490234, 0.0013384819030761719, 0.0014374256134033203, 0.0015363693237304688, 0.0016353130340576172, 0.0017342567443847656, 0.001833200454711914, 0.0019321441650390625, 0.002031087875366211, 0.0021300315856933594, 0.002228975296020508, 0.0023279190063476562, 0.0024268627166748047, 0.002525806427001953, 0.0026247501373291016, 0.00272369384765625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 14.0, 11.0, 20.0, 39.0, 38.0, 74.0, 108.0, 151.0, 251.0, 381.0, 589.0, 964.0, 1527.0, 2570.0, 4856.0, 10619.0, 34621.0, 225139.0, 674430.0, 61887.0, 15816.0, 6210.0, 3242.0, 1869.0, 1149.0, 679.0, 460.0, 273.0, 187.0, 124.0, 82.0, 55.0, 43.0, 26.0, 13.0, 13.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.8125, -91.7724609375, -88.732421875, -85.6923828125, -82.65234375, -79.6123046875, -76.572265625, -73.5322265625, -70.4921875, -67.4521484375, -64.412109375, -61.3720703125, -58.33203125, -55.2919921875, -52.251953125, -49.2119140625, -46.171875, -43.1318359375, -40.091796875, -37.0517578125, -34.01171875, -30.9716796875, -27.931640625, -24.8916015625, -21.8515625, -18.8115234375, -15.771484375, -12.7314453125, -9.69140625, -6.6513671875, -3.611328125, -0.5712890625, 2.46875, 5.5087890625, 8.548828125, 11.5888671875, 14.62890625, 17.6689453125, 20.708984375, 23.7490234375, 26.7890625, 29.8291015625, 32.869140625, 35.9091796875, 38.94921875, 41.9892578125, 45.029296875, 48.0693359375, 51.109375, 54.1494140625, 57.189453125, 60.2294921875, 63.26953125, 66.3095703125, 69.349609375, 72.3896484375, 75.4296875, 78.4697265625, 81.509765625, 84.5498046875, 87.58984375, 90.6298828125, 93.669921875, 96.7099609375, 99.75]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 5.0, 9.0, 25.0, 46.0, 61.0, 83.0, 130.0, 164.0, 138.0, 115.0, 68.0, 42.0, 25.0, 20.0, 12.0, 7.0, 2.0, 4.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.25, -22.5380859375, -21.826171875, -21.1142578125, -20.40234375, -19.6904296875, -18.978515625, -18.2666015625, -17.5546875, -16.8427734375, -16.130859375, -15.4189453125, -14.70703125, -13.9951171875, -13.283203125, -12.5712890625, -11.859375, -11.1474609375, -10.435546875, -9.7236328125, -9.01171875, -8.2998046875, -7.587890625, -6.8759765625, -6.1640625, -5.4521484375, -4.740234375, -4.0283203125, -3.31640625, -2.6044921875, -1.892578125, -1.1806640625, -0.46875, 0.2431640625, 0.955078125, 1.6669921875, 2.37890625, 3.0908203125, 3.802734375, 4.5146484375, 5.2265625, 5.9384765625, 6.650390625, 7.3623046875, 8.07421875, 8.7861328125, 9.498046875, 10.2099609375, 10.921875, 11.6337890625, 12.345703125, 13.0576171875, 13.76953125, 14.4814453125, 15.193359375, 15.9052734375, 16.6171875, 17.3291015625, 18.041015625, 18.7529296875, 19.46484375, 20.1767578125, 20.888671875, 21.6005859375, 22.3125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 15.0, 21.0, 31.0, 39.0, 48.0, 57.0, 98.0, 118.0, 122.0, 74.0, 64.0, 57.0, 55.0, 30.0, 28.0, 23.0, 11.0, 18.0, 13.0, 8.0, 11.0, 5.0, 3.0, 4.0, 8.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.75190544128418, -27.78050994873047, -26.809112548828125, -25.837717056274414, -24.866321563720703, -23.89492416381836, -22.92352867126465, -21.952133178710938, -20.980735778808594, -20.009340286254883, -19.03794288635254, -18.066547393798828, -17.095151901245117, -16.123756408691406, -15.152359008789062, -14.180963516235352, -13.20956802368164, -12.238171577453613, -11.266776084899902, -10.295379638671875, -9.323984146118164, -8.352587699890137, -7.381191253662109, -6.40979528427124, -5.438399314880371, -4.467003345489502, -3.4956071376800537, -2.5242109298706055, -1.5528149604797363, -0.5814189910888672, 0.38997745513916016, 1.3613734245300293, 2.3327674865722656, 3.3041634559631348, 4.275559425354004, 5.246955871582031, 6.2183518409729, 7.1897478103637695, 8.161144256591797, 9.132539749145508, 10.103936195373535, 11.075332641601562, 12.046728134155273, 13.0181245803833, 13.989521026611328, 14.960916519165039, 15.932312965393066, 16.903709411621094, 17.875104904174805, 18.846500396728516, 19.81789779663086, 20.78929328918457, 21.76068878173828, 22.732086181640625, 23.703481674194336, 24.674877166748047, 25.64627456665039, 26.6176700592041, 27.589067459106445, 28.560462951660156, 29.531858444213867, 30.503253936767578, 31.474651336669922, 32.446048736572266, 33.417442321777344]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 7.0, 4.0, 10.0, 11.0, 10.0, 9.0, 15.0, 12.0, 19.0, 19.0, 21.0, 35.0, 24.0, 31.0, 34.0, 32.0, 29.0, 36.0, 28.0, 54.0, 39.0, 30.0, 40.0, 43.0, 37.0, 39.0, 19.0, 25.0, 30.0, 25.0, 33.0, 22.0, 20.0, 12.0, 25.0, 21.0, 19.0, 12.0, 7.0, 13.0, 11.0, 4.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.123947143554688, -20.475723266601562, -19.827499389648438, -19.179275512695312, -18.531051635742188, -17.882827758789062, -17.234603881835938, -16.586380004882812, -15.938157081604004, -15.289933204650879, -14.641709327697754, -13.993485450744629, -13.34526252746582, -12.697038650512695, -12.04881477355957, -11.400590896606445, -10.75236701965332, -10.104143142700195, -9.45591926574707, -8.807695388793945, -8.15947151184082, -7.5112481117248535, -6.863024711608887, -6.214800834655762, -5.566576957702637, -4.918353080749512, -4.270129203796387, -3.62190580368042, -2.973681926727295, -2.32545804977417, -1.677234411239624, -1.0290107727050781, -0.38078880310058594, 0.2674349546432495, 0.915658712387085, 1.5638824701309204, 2.212106227874756, 2.860330104827881, 3.5085537433624268, 4.156777381896973, 4.805001258850098, 5.453225135803223, 6.101449012756348, 6.7496724128723145, 7.3978962898254395, 8.046119689941406, 8.694343566894531, 9.342567443847656, 9.990791320800781, 10.639015197753906, 11.287239074707031, 11.935462951660156, 12.583686828613281, 13.231910705566406, 13.880133628845215, 14.52835750579834, 15.176581382751465, 15.82480525970459, 16.4730281829834, 17.121252059936523, 17.76947593688965, 18.417699813842773, 19.0659236907959, 19.714147567749023, 20.36237144470215]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [6.0, 1.0, 2.0, 1.0, 4.0, 8.0, 12.0, 18.0, 23.0, 38.0, 36.0, 62.0, 84.0, 138.0, 198.0, 253.0, 347.0, 537.0, 775.0, 1100.0, 1607.0, 2266.0, 3305.0, 4844.0, 7170.0, 10828.0, 16639.0, 27685.0, 47425.0, 90150.0, 197626.0, 695873.0, 1975089.0, 693244.0, 198540.0, 90905.0, 49310.0, 28269.0, 17355.0, 10887.0, 7040.0, 4534.0, 3019.0, 2084.0, 1488.0, 1003.0, 705.0, 522.0, 383.0, 261.0, 175.0, 107.0, 93.0, 74.0, 47.0, 33.0, 19.0, 22.0, 6.0, 9.0, 8.0, 7.0, 2.0, 3.0], "bins": [-30.796875, -29.849609375, -28.90234375, -27.955078125, -27.0078125, -26.060546875, -25.11328125, -24.166015625, -23.21875, -22.271484375, -21.32421875, -20.376953125, -19.4296875, -18.482421875, -17.53515625, -16.587890625, -15.640625, -14.693359375, -13.74609375, -12.798828125, -11.8515625, -10.904296875, -9.95703125, -9.009765625, -8.0625, -7.115234375, -6.16796875, -5.220703125, -4.2734375, -3.326171875, -2.37890625, -1.431640625, -0.484375, 0.462890625, 1.41015625, 2.357421875, 3.3046875, 4.251953125, 5.19921875, 6.146484375, 7.09375, 8.041015625, 8.98828125, 9.935546875, 10.8828125, 11.830078125, 12.77734375, 13.724609375, 14.671875, 15.619140625, 16.56640625, 17.513671875, 18.4609375, 19.408203125, 20.35546875, 21.302734375, 22.25, 23.197265625, 24.14453125, 25.091796875, 26.0390625, 26.986328125, 27.93359375, 28.880859375, 29.828125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 8.0, 4.0, 3.0, 6.0, 10.0, 6.0, 8.0, 14.0, 11.0, 12.0, 15.0, 21.0, 17.0, 22.0, 27.0, 27.0, 33.0, 33.0, 33.0, 40.0, 29.0, 31.0, 38.0, 42.0, 34.0, 37.0, 33.0, 33.0, 42.0, 33.0, 31.0, 20.0, 29.0, 24.0, 23.0, 27.0, 22.0, 16.0, 17.0, 15.0, 11.0, 14.0, 14.0, 8.0, 12.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-11.5703125, -11.215087890625, -10.85986328125, -10.504638671875, -10.1494140625, -9.794189453125, -9.43896484375, -9.083740234375, -8.728515625, -8.373291015625, -8.01806640625, -7.662841796875, -7.3076171875, -6.952392578125, -6.59716796875, -6.241943359375, -5.88671875, -5.531494140625, -5.17626953125, -4.821044921875, -4.4658203125, -4.110595703125, -3.75537109375, -3.400146484375, -3.044921875, -2.689697265625, -2.33447265625, -1.979248046875, -1.6240234375, -1.268798828125, -0.91357421875, -0.558349609375, -0.203125, 0.152099609375, 0.50732421875, 0.862548828125, 1.2177734375, 1.572998046875, 1.92822265625, 2.283447265625, 2.638671875, 2.993896484375, 3.34912109375, 3.704345703125, 4.0595703125, 4.414794921875, 4.77001953125, 5.125244140625, 5.48046875, 5.835693359375, 6.19091796875, 6.546142578125, 6.9013671875, 7.256591796875, 7.61181640625, 7.967041015625, 8.322265625, 8.677490234375, 9.03271484375, 9.387939453125, 9.7431640625, 10.098388671875, 10.45361328125, 10.808837890625, 11.1640625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 7.0, 7.0, 18.0, 24.0, 33.0, 55.0, 88.0, 111.0, 206.0, 313.0, 428.0, 732.0, 1149.0, 1820.0, 2971.0, 4883.0, 8227.0, 14734.0, 26201.0, 51009.0, 106387.0, 260761.0, 910753.0, 1990910.0, 481729.0, 169936.0, 74726.0, 37739.0, 20085.0, 11338.0, 6735.0, 3819.0, 2372.0, 1449.0, 911.0, 538.0, 384.0, 263.0, 161.0, 103.0, 55.0, 47.0, 25.0, 17.0, 12.0, 6.0, 1.0, 2.0, 4.0, 3.0, 2.0], "bins": [-33.75, -32.819580078125, -31.88916015625, -30.958740234375, -30.0283203125, -29.097900390625, -28.16748046875, -27.237060546875, -26.306640625, -25.376220703125, -24.44580078125, -23.515380859375, -22.5849609375, -21.654541015625, -20.72412109375, -19.793701171875, -18.86328125, -17.932861328125, -17.00244140625, -16.072021484375, -15.1416015625, -14.211181640625, -13.28076171875, -12.350341796875, -11.419921875, -10.489501953125, -9.55908203125, -8.628662109375, -7.6982421875, -6.767822265625, -5.83740234375, -4.906982421875, -3.9765625, -3.046142578125, -2.11572265625, -1.185302734375, -0.2548828125, 0.675537109375, 1.60595703125, 2.536376953125, 3.466796875, 4.397216796875, 5.32763671875, 6.258056640625, 7.1884765625, 8.118896484375, 9.04931640625, 9.979736328125, 10.91015625, 11.840576171875, 12.77099609375, 13.701416015625, 14.6318359375, 15.562255859375, 16.49267578125, 17.423095703125, 18.353515625, 19.283935546875, 20.21435546875, 21.144775390625, 22.0751953125, 23.005615234375, 23.93603515625, 24.866455078125, 25.796875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 12.0, 18.0, 15.0, 19.0, 25.0, 24.0, 35.0, 45.0, 50.0, 54.0, 71.0, 94.0, 105.0, 131.0, 143.0, 202.0, 269.0, 334.0, 363.0, 390.0, 313.0, 295.0, 182.0, 164.0, 148.0, 107.0, 84.0, 81.0, 58.0, 49.0, 39.0, 30.0, 13.0, 21.0, 25.0, 14.0, 7.0, 10.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9375, -6.71478271484375, -6.4920654296875, -6.26934814453125, -6.046630859375, -5.82391357421875, -5.6011962890625, -5.37847900390625, -5.15576171875, -4.93304443359375, -4.7103271484375, -4.48760986328125, -4.264892578125, -4.04217529296875, -3.8194580078125, -3.59674072265625, -3.3740234375, -3.15130615234375, -2.9285888671875, -2.70587158203125, -2.483154296875, -2.26043701171875, -2.0377197265625, -1.81500244140625, -1.59228515625, -1.36956787109375, -1.1468505859375, -0.92413330078125, -0.701416015625, -0.47869873046875, -0.2559814453125, -0.03326416015625, 0.189453125, 0.41217041015625, 0.6348876953125, 0.85760498046875, 1.080322265625, 1.30303955078125, 1.5257568359375, 1.74847412109375, 1.97119140625, 2.19390869140625, 2.4166259765625, 2.63934326171875, 2.862060546875, 3.08477783203125, 3.3074951171875, 3.53021240234375, 3.7529296875, 3.97564697265625, 4.1983642578125, 4.42108154296875, 4.643798828125, 4.86651611328125, 5.0892333984375, 5.31195068359375, 5.53466796875, 5.75738525390625, 5.9801025390625, 6.20281982421875, 6.425537109375, 6.64825439453125, 6.8709716796875, 7.09368896484375, 7.31640625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 5.0, 1.0, 11.0, 12.0, 9.0, 10.0, 21.0, 24.0, 31.0, 50.0, 65.0, 87.0, 112.0, 153.0, 109.0, 76.0, 44.0, 44.0, 30.0, 26.0, 20.0, 11.0, 10.0, 2.0, 6.0, 10.0, 4.0, 1.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.554777145385742, -23.79597282409668, -23.037168502807617, -22.278364181518555, -21.519559860229492, -20.76075553894043, -20.001951217651367, -19.243146896362305, -18.484342575073242, -17.72553825378418, -16.966733932495117, -16.207929611206055, -15.449125289916992, -14.69032096862793, -13.931516647338867, -13.172712326049805, -12.413907051086426, -11.655102729797363, -10.8962984085083, -10.137494087219238, -9.378689765930176, -8.619885444641113, -7.861080646514893, -7.10227632522583, -6.343472003936768, -5.584667682647705, -4.825863361358643, -4.067058563232422, -3.3082544803619385, -2.549450159072876, -1.7906455993652344, -1.0318412780761719, -0.2730369567871094, 0.4857674241065979, 1.2445718050003052, 2.0033762454986572, 2.7621805667877197, 3.5209848880767822, 4.279789447784424, 5.038593769073486, 5.797398090362549, 6.556202411651611, 7.315006732940674, 8.073811531066895, 8.832615852355957, 9.59142017364502, 10.350224494934082, 11.109028816223145, 11.867833137512207, 12.62663745880127, 13.385441780090332, 14.144246101379395, 14.903050422668457, 15.66185474395752, 16.4206600189209, 17.17946434020996, 17.938268661499023, 18.697072982788086, 19.45587730407715, 20.21468162536621, 20.973485946655273, 21.732290267944336, 22.4910945892334, 23.24989891052246, 24.008703231811523]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 10.0, 2.0, 10.0, 11.0, 10.0, 8.0, 6.0, 10.0, 15.0, 14.0, 16.0, 21.0, 25.0, 20.0, 24.0, 25.0, 27.0, 35.0, 40.0, 29.0, 36.0, 31.0, 28.0, 31.0, 50.0, 38.0, 45.0, 24.0, 27.0, 31.0, 36.0, 20.0, 32.0, 23.0, 22.0, 25.0, 20.0, 18.0, 12.0, 9.0, 9.0, 11.0, 10.0, 7.0, 13.0, 8.0, 9.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.745596885681152, -11.364648818969727, -10.9837007522583, -10.602752685546875, -10.221805572509766, -9.84085750579834, -9.459909439086914, -9.078961372375488, -8.698013305664062, -8.317065238952637, -7.936117172241211, -7.555169582366943, -7.174221515655518, -6.793273448944092, -6.412325859069824, -6.031377792358398, -5.650429725646973, -5.269481658935547, -4.888533592224121, -4.5075860023498535, -4.126637935638428, -3.745689868927002, -3.3647420406341553, -2.9837942123413086, -2.602846145629883, -2.221898078918457, -1.8409502506256104, -1.4600023031234741, -1.079054355621338, -0.6981064081192017, -0.31715846061706543, 0.06378936767578125, 0.44473838806152344, 0.8256863355636597, 1.206634283065796, 1.5875822305679321, 1.9685301780700684, 2.349478244781494, 2.730426073074341, 3.1113739013671875, 3.4923219680786133, 3.873270034790039, 4.254218101501465, 4.635165691375732, 5.016113758087158, 5.397061824798584, 5.778009414672852, 6.158957481384277, 6.539905548095703, 6.920853614807129, 7.301801681518555, 7.682749271392822, 8.063697814941406, 8.444644927978516, 8.825592994689941, 9.206541061401367, 9.587489128112793, 9.968437194824219, 10.349385261535645, 10.73033332824707, 11.11128044128418, 11.492228507995605, 11.873176574707031, 12.254124641418457, 12.635072708129883]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 7.0, 6.0, 13.0, 19.0, 27.0, 49.0, 53.0, 79.0, 93.0, 148.0, 179.0, 292.0, 389.0, 487.0, 723.0, 1022.0, 1398.0, 1971.0, 2865.0, 4288.0, 6288.0, 9733.0, 15255.0, 24646.0, 42096.0, 75482.0, 150344.0, 306109.0, 186939.0, 89491.0, 48865.0, 28508.0, 17076.0, 10925.0, 7146.0, 4686.0, 3286.0, 2150.0, 1560.0, 1087.0, 794.0, 529.0, 420.0, 296.0, 208.0, 120.0, 120.0, 79.0, 60.0, 35.0, 32.0, 22.0, 20.0, 14.0, 12.0, 9.0, 7.0, 3.0, 3.0, 0.0, 1.0], "bins": [-5.73828125, -5.55096435546875, -5.3636474609375, -5.17633056640625, -4.989013671875, -4.80169677734375, -4.6143798828125, -4.42706298828125, -4.23974609375, -4.05242919921875, -3.8651123046875, -3.67779541015625, -3.490478515625, -3.30316162109375, -3.1158447265625, -2.92852783203125, -2.7412109375, -2.55389404296875, -2.3665771484375, -2.17926025390625, -1.991943359375, -1.80462646484375, -1.6173095703125, -1.42999267578125, -1.24267578125, -1.05535888671875, -0.8680419921875, -0.68072509765625, -0.493408203125, -0.30609130859375, -0.1187744140625, 0.06854248046875, 0.255859375, 0.44317626953125, 0.6304931640625, 0.81781005859375, 1.005126953125, 1.19244384765625, 1.3797607421875, 1.56707763671875, 1.75439453125, 1.94171142578125, 2.1290283203125, 2.31634521484375, 2.503662109375, 2.69097900390625, 2.8782958984375, 3.06561279296875, 3.2529296875, 3.44024658203125, 3.6275634765625, 3.81488037109375, 4.002197265625, 4.18951416015625, 4.3768310546875, 4.56414794921875, 4.75146484375, 4.93878173828125, 5.1260986328125, 5.31341552734375, 5.500732421875, 5.68804931640625, 5.8753662109375, 6.06268310546875, 6.25]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 5.0, 5.0, 13.0, 8.0, 11.0, 8.0, 13.0, 10.0, 19.0, 19.0, 30.0, 12.0, 24.0, 20.0, 30.0, 35.0, 31.0, 39.0, 38.0, 39.0, 38.0, 34.0, 27.0, 47.0, 42.0, 23.0, 34.0, 34.0, 36.0, 27.0, 22.0, 25.0, 25.0, 19.0, 22.0, 12.0, 17.0, 15.0, 14.0, 12.0, 3.0, 8.0, 7.0, 8.0, 8.0, 5.0, 2.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.2890625, -11.894287109375, -11.49951171875, -11.104736328125, -10.7099609375, -10.315185546875, -9.92041015625, -9.525634765625, -9.130859375, -8.736083984375, -8.34130859375, -7.946533203125, -7.5517578125, -7.156982421875, -6.76220703125, -6.367431640625, -5.97265625, -5.577880859375, -5.18310546875, -4.788330078125, -4.3935546875, -3.998779296875, -3.60400390625, -3.209228515625, -2.814453125, -2.419677734375, -2.02490234375, -1.630126953125, -1.2353515625, -0.840576171875, -0.44580078125, -0.051025390625, 0.34375, 0.738525390625, 1.13330078125, 1.528076171875, 1.9228515625, 2.317626953125, 2.71240234375, 3.107177734375, 3.501953125, 3.896728515625, 4.29150390625, 4.686279296875, 5.0810546875, 5.475830078125, 5.87060546875, 6.265380859375, 6.66015625, 7.054931640625, 7.44970703125, 7.844482421875, 8.2392578125, 8.634033203125, 9.02880859375, 9.423583984375, 9.818359375, 10.213134765625, 10.60791015625, 11.002685546875, 11.3974609375, 11.792236328125, 12.18701171875, 12.581787109375, 12.9765625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [7.0, 3.0, 3.0, 7.0, 8.0, 5.0, 13.0, 27.0, 23.0, 31.0, 47.0, 73.0, 101.0, 127.0, 155.0, 248.0, 310.0, 477.0, 594.0, 846.0, 1229.0, 1735.0, 2455.0, 3768.0, 5784.0, 9417.0, 15632.0, 27898.0, 55696.0, 132155.0, 413192.0, 210591.0, 76968.0, 36429.0, 19748.0, 11414.0, 7034.0, 4522.0, 2872.0, 2031.0, 1344.0, 1007.0, 673.0, 505.0, 349.0, 253.0, 219.0, 128.0, 101.0, 78.0, 66.0, 44.0, 33.0, 21.0, 20.0, 8.0, 16.0, 4.0, 6.0, 8.0, 6.0, 5.0, 0.0, 7.0], "bins": [-7.96875, -7.709228515625, -7.44970703125, -7.190185546875, -6.9306640625, -6.671142578125, -6.41162109375, -6.152099609375, -5.892578125, -5.633056640625, -5.37353515625, -5.114013671875, -4.8544921875, -4.594970703125, -4.33544921875, -4.075927734375, -3.81640625, -3.556884765625, -3.29736328125, -3.037841796875, -2.7783203125, -2.518798828125, -2.25927734375, -1.999755859375, -1.740234375, -1.480712890625, -1.22119140625, -0.961669921875, -0.7021484375, -0.442626953125, -0.18310546875, 0.076416015625, 0.3359375, 0.595458984375, 0.85498046875, 1.114501953125, 1.3740234375, 1.633544921875, 1.89306640625, 2.152587890625, 2.412109375, 2.671630859375, 2.93115234375, 3.190673828125, 3.4501953125, 3.709716796875, 3.96923828125, 4.228759765625, 4.48828125, 4.747802734375, 5.00732421875, 5.266845703125, 5.5263671875, 5.785888671875, 6.04541015625, 6.304931640625, 6.564453125, 6.823974609375, 7.08349609375, 7.343017578125, 7.6025390625, 7.862060546875, 8.12158203125, 8.381103515625, 8.640625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 10.0, 9.0, 11.0, 7.0, 13.0, 16.0, 27.0, 23.0, 26.0, 35.0, 36.0, 38.0, 39.0, 43.0, 41.0, 43.0, 57.0, 50.0, 49.0, 32.0, 57.0, 44.0, 40.0, 27.0, 28.0, 29.0, 33.0, 24.0, 24.0, 12.0, 16.0, 8.0, 8.0, 6.0, 8.0, 8.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.875, -10.5333251953125, -10.191650390625, -9.8499755859375, -9.50830078125, -9.1666259765625, -8.824951171875, -8.4832763671875, -8.1416015625, -7.7999267578125, -7.458251953125, -7.1165771484375, -6.77490234375, -6.4332275390625, -6.091552734375, -5.7498779296875, -5.408203125, -5.0665283203125, -4.724853515625, -4.3831787109375, -4.04150390625, -3.6998291015625, -3.358154296875, -3.0164794921875, -2.6748046875, -2.3331298828125, -1.991455078125, -1.6497802734375, -1.30810546875, -0.9664306640625, -0.624755859375, -0.2830810546875, 0.05859375, 0.4002685546875, 0.741943359375, 1.0836181640625, 1.42529296875, 1.7669677734375, 2.108642578125, 2.4503173828125, 2.7919921875, 3.1336669921875, 3.475341796875, 3.8170166015625, 4.15869140625, 4.5003662109375, 4.842041015625, 5.1837158203125, 5.525390625, 5.8670654296875, 6.208740234375, 6.5504150390625, 6.89208984375, 7.2337646484375, 7.575439453125, 7.9171142578125, 8.2587890625, 8.6004638671875, 8.942138671875, 9.2838134765625, 9.62548828125, 9.9671630859375, 10.308837890625, 10.6505126953125, 10.9921875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 8.0, 3.0, 4.0, 8.0, 3.0, 8.0, 13.0, 17.0, 27.0, 36.0, 43.0, 55.0, 66.0, 116.0, 168.0, 224.0, 306.0, 406.0, 568.0, 824.0, 1233.0, 1722.0, 2541.0, 4007.0, 6257.0, 10544.0, 17909.0, 33255.0, 69579.0, 210883.0, 479225.0, 104290.0, 45018.0, 23221.0, 13057.0, 7935.0, 4851.0, 3321.0, 2076.0, 1444.0, 961.0, 639.0, 462.0, 338.0, 244.0, 178.0, 111.0, 109.0, 68.0, 53.0, 35.0, 34.0, 21.0, 13.0, 8.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0], "bins": [-1.99609375, -1.936004638671875, -1.87591552734375, -1.815826416015625, -1.7557373046875, -1.695648193359375, -1.63555908203125, -1.575469970703125, -1.515380859375, -1.455291748046875, -1.39520263671875, -1.335113525390625, -1.2750244140625, -1.214935302734375, -1.15484619140625, -1.094757080078125, -1.03466796875, -0.974578857421875, -0.91448974609375, -0.854400634765625, -0.7943115234375, -0.734222412109375, -0.67413330078125, -0.614044189453125, -0.553955078125, -0.493865966796875, -0.43377685546875, -0.373687744140625, -0.3135986328125, -0.253509521484375, -0.19342041015625, -0.133331298828125, -0.0732421875, -0.013153076171875, 0.04693603515625, 0.107025146484375, 0.1671142578125, 0.227203369140625, 0.28729248046875, 0.347381591796875, 0.407470703125, 0.467559814453125, 0.52764892578125, 0.587738037109375, 0.6478271484375, 0.707916259765625, 0.76800537109375, 0.828094482421875, 0.88818359375, 0.948272705078125, 1.00836181640625, 1.068450927734375, 1.1285400390625, 1.188629150390625, 1.24871826171875, 1.308807373046875, 1.368896484375, 1.428985595703125, 1.48907470703125, 1.549163818359375, 1.6092529296875, 1.669342041015625, 1.72943115234375, 1.789520263671875, 1.849609375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 6.0, 3.0, 5.0, 5.0, 18.0, 11.0, 11.0, 23.0, 27.0, 30.0, 40.0, 84.0, 122.0, 159.0, 134.0, 90.0, 61.0, 45.0, 31.0, 20.0, 14.0, 7.0, 7.0, 12.0, 7.0, 4.0, 4.0, 4.0, 2.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0002636909484863281, -0.0002565048635005951, -0.00024931877851486206, -0.00024213269352912903, -0.000234946608543396, -0.00022776052355766296, -0.00022057443857192993, -0.0002133883535861969, -0.00020620226860046387, -0.00019901618361473083, -0.0001918300986289978, -0.00018464401364326477, -0.00017745792865753174, -0.0001702718436717987, -0.00016308575868606567, -0.00015589967370033264, -0.0001487135887145996, -0.00014152750372886658, -0.00013434141874313354, -0.0001271553337574005, -0.00011996924877166748, -0.00011278316378593445, -0.00010559707880020142, -9.841099381446838e-05, -9.122490882873535e-05, -8.403882384300232e-05, -7.685273885726929e-05, -6.966665387153625e-05, -6.248056888580322e-05, -5.529448390007019e-05, -4.810839891433716e-05, -4.0922313928604126e-05, -3.3736228942871094e-05, -2.655014395713806e-05, -1.936405897140503e-05, -1.2177973985671997e-05, -4.991888999938965e-06, 2.1941959857940674e-06, 9.3802809715271e-06, 1.6566365957260132e-05, 2.3752450942993164e-05, 3.0938535928726196e-05, 3.812462091445923e-05, 4.531070590019226e-05, 5.249679088592529e-05, 5.9682875871658325e-05, 6.686896085739136e-05, 7.405504584312439e-05, 8.124113082885742e-05, 8.842721581459045e-05, 9.561330080032349e-05, 0.00010279938578605652, 0.00010998547077178955, 0.00011717155575752258, 0.00012435764074325562, 0.00013154372572898865, 0.00013872981071472168, 0.0001459158957004547, 0.00015310198068618774, 0.00016028806567192078, 0.0001674741506576538, 0.00017466023564338684, 0.00018184632062911987, 0.0001890324056148529, 0.00019621849060058594]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 12.0, 13.0, 24.0, 34.0, 50.0, 86.0, 119.0, 180.0, 273.0, 403.0, 601.0, 861.0, 1376.0, 1920.0, 2977.0, 4559.0, 6956.0, 10819.0, 17701.0, 28493.0, 49571.0, 95220.0, 345070.0, 269853.0, 89680.0, 47085.0, 27642.0, 16769.0, 10387.0, 6814.0, 4435.0, 2883.0, 1885.0, 1217.0, 816.0, 578.0, 406.0, 255.0, 187.0, 119.0, 79.0, 55.0, 32.0, 21.0, 10.0, 7.0, 9.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-5.10546875, -4.9505615234375, -4.795654296875, -4.6407470703125, -4.48583984375, -4.3309326171875, -4.176025390625, -4.0211181640625, -3.8662109375, -3.7113037109375, -3.556396484375, -3.4014892578125, -3.24658203125, -3.0916748046875, -2.936767578125, -2.7818603515625, -2.626953125, -2.4720458984375, -2.317138671875, -2.1622314453125, -2.00732421875, -1.8524169921875, -1.697509765625, -1.5426025390625, -1.3876953125, -1.2327880859375, -1.077880859375, -0.9229736328125, -0.76806640625, -0.6131591796875, -0.458251953125, -0.3033447265625, -0.1484375, 0.0064697265625, 0.161376953125, 0.3162841796875, 0.47119140625, 0.6260986328125, 0.781005859375, 0.9359130859375, 1.0908203125, 1.2457275390625, 1.400634765625, 1.5555419921875, 1.71044921875, 1.8653564453125, 2.020263671875, 2.1751708984375, 2.330078125, 2.4849853515625, 2.639892578125, 2.7947998046875, 2.94970703125, 3.1046142578125, 3.259521484375, 3.4144287109375, 3.5693359375, 3.7242431640625, 3.879150390625, 4.0340576171875, 4.18896484375, 4.3438720703125, 4.498779296875, 4.6536865234375, 4.80859375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 8.0, 8.0, 16.0, 12.0, 25.0, 18.0, 13.0, 22.0, 27.0, 30.0, 20.0, 37.0, 23.0, 32.0, 44.0, 54.0, 62.0, 92.0, 47.0, 34.0, 34.0, 27.0, 24.0, 30.0, 29.0, 31.0, 20.0, 18.0, 22.0, 21.0, 18.0, 16.0, 10.0, 7.0, 10.0, 5.0, 12.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.22265625, -1.1833953857421875, -1.144134521484375, -1.1048736572265625, -1.06561279296875, -1.0263519287109375, -0.987091064453125, -0.9478302001953125, -0.9085693359375, -0.8693084716796875, -0.830047607421875, -0.7907867431640625, -0.75152587890625, -0.7122650146484375, -0.673004150390625, -0.6337432861328125, -0.594482421875, -0.5552215576171875, -0.515960693359375, -0.4766998291015625, -0.43743896484375, -0.3981781005859375, -0.358917236328125, -0.3196563720703125, -0.2803955078125, -0.2411346435546875, -0.201873779296875, -0.1626129150390625, -0.12335205078125, -0.0840911865234375, -0.044830322265625, -0.0055694580078125, 0.03369140625, 0.0729522705078125, 0.112213134765625, 0.1514739990234375, 0.19073486328125, 0.2299957275390625, 0.269256591796875, 0.3085174560546875, 0.3477783203125, 0.3870391845703125, 0.426300048828125, 0.4655609130859375, 0.50482177734375, 0.5440826416015625, 0.583343505859375, 0.6226043701171875, 0.661865234375, 0.7011260986328125, 0.740386962890625, 0.7796478271484375, 0.81890869140625, 0.8581695556640625, 0.897430419921875, 0.9366912841796875, 0.9759521484375, 1.0152130126953125, 1.054473876953125, 1.0937347412109375, 1.13299560546875, 1.1722564697265625, 1.211517333984375, 1.2507781982421875, 1.2900390625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 4.0, 3.0, 9.0, 6.0, 13.0, 16.0, 16.0, 32.0, 34.0, 46.0, 74.0, 107.0, 146.0, 130.0, 102.0, 64.0, 39.0, 27.0, 27.0, 36.0, 12.0, 10.0, 7.0, 4.0, 7.0, 3.0, 3.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.28109359741211, -25.48111343383789, -24.681135177612305, -23.881155014038086, -23.0811767578125, -22.28119659423828, -21.481216430664062, -20.681238174438477, -19.88125991821289, -19.081279754638672, -18.281301498413086, -17.481321334838867, -16.68134307861328, -15.881362915039062, -15.08138370513916, -14.281404495239258, -13.481424331665039, -12.681445121765137, -11.881465911865234, -11.081485748291016, -10.28150749206543, -9.481527328491211, -8.681548118591309, -7.881568908691406, -7.081589698791504, -6.281610488891602, -5.481631278991699, -4.681651592254639, -3.8816723823547363, -3.081693172454834, -2.2817134857177734, -1.481734275817871, -0.6817550659179688, 0.11822426319122314, 0.918203592300415, 1.7181830406188965, 2.518162250518799, 3.318141460418701, 4.118121147155762, 4.918100357055664, 5.718079566955566, 6.518058776855469, 7.318037986755371, 8.118017196655273, 8.917997360229492, 9.717975616455078, 10.517955780029297, 11.3179349899292, 12.117914199829102, 12.917893409729004, 13.717872619628906, 14.517852783203125, 15.317831039428711, 16.11781120300293, 16.917789459228516, 17.717769622802734, 18.517749786376953, 19.317729949951172, 20.117708206176758, 20.917688369750977, 21.717666625976562, 22.51764678955078, 23.317626953125, 24.117605209350586, 24.917583465576172]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 8.0, 8.0, 14.0, 3.0, 10.0, 11.0, 14.0, 10.0, 10.0, 10.0, 18.0, 22.0, 31.0, 25.0, 24.0, 27.0, 27.0, 30.0, 35.0, 36.0, 38.0, 38.0, 37.0, 30.0, 46.0, 37.0, 35.0, 30.0, 26.0, 29.0, 33.0, 31.0, 26.0, 28.0, 18.0, 20.0, 14.0, 11.0, 11.0, 9.0, 11.0, 7.0, 17.0, 14.0, 11.0, 5.0, 1.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-12.938288688659668, -12.524230003356934, -12.1101713180542, -11.696112632751465, -11.28205394744873, -10.867995262145996, -10.453936576843262, -10.039877891540527, -9.625819206237793, -9.211760520935059, -8.797701835632324, -8.38364315032959, -7.9695844650268555, -7.555525779724121, -7.141467094421387, -6.727408409118652, -6.313349723815918, -5.899291038513184, -5.485232353210449, -5.071173667907715, -4.6571149826049805, -4.243056297302246, -3.8289976119995117, -3.4149389266967773, -3.000880241394043, -2.5868215560913086, -2.172762870788574, -1.7587041854858398, -1.3446455001831055, -0.9305868148803711, -0.5165281295776367, -0.10246944427490234, 0.31159019470214844, 0.7256488800048828, 1.1397075653076172, 1.5537662506103516, 1.967824935913086, 2.3818836212158203, 2.7959423065185547, 3.210000991821289, 3.6240596771240234, 4.038118362426758, 4.452177047729492, 4.866235733032227, 5.280294418334961, 5.694353103637695, 6.10841178894043, 6.522470474243164, 6.936529159545898, 7.350587844848633, 7.764646530151367, 8.178705215454102, 8.592763900756836, 9.00682258605957, 9.420881271362305, 9.834939956665039, 10.248998641967773, 10.663057327270508, 11.077116012573242, 11.491174697875977, 11.905233383178711, 12.319292068481445, 12.73335075378418, 13.147409439086914, 13.561468124389648]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 5.0, 10.0, 13.0, 12.0, 20.0, 28.0, 54.0, 64.0, 89.0, 105.0, 178.0, 293.0, 416.0, 694.0, 1090.0, 1868.0, 3135.0, 5634.0, 10269.0, 18845.0, 35859.0, 71377.0, 148523.0, 295892.0, 231647.0, 108526.0, 53262.0, 27194.0, 14387.0, 8009.0, 4514.0, 2493.0, 1488.0, 879.0, 572.0, 361.0, 236.0, 154.0, 102.0, 72.0, 53.0, 48.0, 18.0, 19.0, 12.0, 7.0, 12.0, 9.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-29.484375, -28.61181640625, -27.7392578125, -26.86669921875, -25.994140625, -25.12158203125, -24.2490234375, -23.37646484375, -22.50390625, -21.63134765625, -20.7587890625, -19.88623046875, -19.013671875, -18.14111328125, -17.2685546875, -16.39599609375, -15.5234375, -14.65087890625, -13.7783203125, -12.90576171875, -12.033203125, -11.16064453125, -10.2880859375, -9.41552734375, -8.54296875, -7.67041015625, -6.7978515625, -5.92529296875, -5.052734375, -4.18017578125, -3.3076171875, -2.43505859375, -1.5625, -0.68994140625, 0.1826171875, 1.05517578125, 1.927734375, 2.80029296875, 3.6728515625, 4.54541015625, 5.41796875, 6.29052734375, 7.1630859375, 8.03564453125, 8.908203125, 9.78076171875, 10.6533203125, 11.52587890625, 12.3984375, 13.27099609375, 14.1435546875, 15.01611328125, 15.888671875, 16.76123046875, 17.6337890625, 18.50634765625, 19.37890625, 20.25146484375, 21.1240234375, 21.99658203125, 22.869140625, 23.74169921875, 24.6142578125, 25.48681640625, 26.359375]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 13.0, 9.0, 7.0, 13.0, 12.0, 13.0, 12.0, 12.0, 18.0, 19.0, 27.0, 26.0, 24.0, 24.0, 29.0, 32.0, 41.0, 37.0, 30.0, 34.0, 53.0, 40.0, 44.0, 32.0, 45.0, 40.0, 28.0, 24.0, 24.0, 32.0, 36.0, 20.0, 20.0, 16.0, 10.0, 14.0, 12.0, 10.0, 7.0, 8.0, 11.0, 14.0, 9.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.1953125, -11.800537109375, -11.40576171875, -11.010986328125, -10.6162109375, -10.221435546875, -9.82666015625, -9.431884765625, -9.037109375, -8.642333984375, -8.24755859375, -7.852783203125, -7.4580078125, -7.063232421875, -6.66845703125, -6.273681640625, -5.87890625, -5.484130859375, -5.08935546875, -4.694580078125, -4.2998046875, -3.905029296875, -3.51025390625, -3.115478515625, -2.720703125, -2.325927734375, -1.93115234375, -1.536376953125, -1.1416015625, -0.746826171875, -0.35205078125, 0.042724609375, 0.4375, 0.832275390625, 1.22705078125, 1.621826171875, 2.0166015625, 2.411376953125, 2.80615234375, 3.200927734375, 3.595703125, 3.990478515625, 4.38525390625, 4.780029296875, 5.1748046875, 5.569580078125, 5.96435546875, 6.359130859375, 6.75390625, 7.148681640625, 7.54345703125, 7.938232421875, 8.3330078125, 8.727783203125, 9.12255859375, 9.517333984375, 9.912109375, 10.306884765625, 10.70166015625, 11.096435546875, 11.4912109375, 11.885986328125, 12.28076171875, 12.675537109375, 13.0703125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 19.0, 13.0, 27.0, 37.0, 49.0, 89.0, 130.0, 178.0, 315.0, 436.0, 588.0, 1050.0, 1751.0, 2789.0, 4615.0, 7801.0, 13943.0, 25937.0, 49058.0, 99125.0, 208936.0, 309512.0, 158450.0, 76453.0, 38763.0, 20551.0, 11278.0, 6497.0, 3826.0, 2243.0, 1449.0, 976.0, 568.0, 362.0, 252.0, 149.0, 96.0, 65.0, 61.0, 38.0, 21.0, 15.0, 5.0, 8.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-29.59375, -28.7314453125, -27.869140625, -27.0068359375, -26.14453125, -25.2822265625, -24.419921875, -23.5576171875, -22.6953125, -21.8330078125, -20.970703125, -20.1083984375, -19.24609375, -18.3837890625, -17.521484375, -16.6591796875, -15.796875, -14.9345703125, -14.072265625, -13.2099609375, -12.34765625, -11.4853515625, -10.623046875, -9.7607421875, -8.8984375, -8.0361328125, -7.173828125, -6.3115234375, -5.44921875, -4.5869140625, -3.724609375, -2.8623046875, -2.0, -1.1376953125, -0.275390625, 0.5869140625, 1.44921875, 2.3115234375, 3.173828125, 4.0361328125, 4.8984375, 5.7607421875, 6.623046875, 7.4853515625, 8.34765625, 9.2099609375, 10.072265625, 10.9345703125, 11.796875, 12.6591796875, 13.521484375, 14.3837890625, 15.24609375, 16.1083984375, 16.970703125, 17.8330078125, 18.6953125, 19.5576171875, 20.419921875, 21.2822265625, 22.14453125, 23.0068359375, 23.869140625, 24.7314453125, 25.59375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 6.0, 1.0, 5.0, 12.0, 10.0, 8.0, 15.0, 13.0, 25.0, 24.0, 26.0, 21.0, 41.0, 37.0, 41.0, 38.0, 41.0, 53.0, 51.0, 50.0, 57.0, 44.0, 39.0, 36.0, 40.0, 39.0, 33.0, 27.0, 27.0, 26.0, 21.0, 14.0, 18.0, 11.0, 13.0, 8.0, 9.0, 8.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5078125, -9.16552734375, -8.8232421875, -8.48095703125, -8.138671875, -7.79638671875, -7.4541015625, -7.11181640625, -6.76953125, -6.42724609375, -6.0849609375, -5.74267578125, -5.400390625, -5.05810546875, -4.7158203125, -4.37353515625, -4.03125, -3.68896484375, -3.3466796875, -3.00439453125, -2.662109375, -2.31982421875, -1.9775390625, -1.63525390625, -1.29296875, -0.95068359375, -0.6083984375, -0.26611328125, 0.076171875, 0.41845703125, 0.7607421875, 1.10302734375, 1.4453125, 1.78759765625, 2.1298828125, 2.47216796875, 2.814453125, 3.15673828125, 3.4990234375, 3.84130859375, 4.18359375, 4.52587890625, 4.8681640625, 5.21044921875, 5.552734375, 5.89501953125, 6.2373046875, 6.57958984375, 6.921875, 7.26416015625, 7.6064453125, 7.94873046875, 8.291015625, 8.63330078125, 8.9755859375, 9.31787109375, 9.66015625, 10.00244140625, 10.3447265625, 10.68701171875, 11.029296875, 11.37158203125, 11.7138671875, 12.05615234375, 12.3984375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 1.0, 5.0, 9.0, 21.0, 21.0, 23.0, 37.0, 45.0, 86.0, 138.0, 192.0, 282.0, 451.0, 716.0, 1174.0, 2053.0, 3967.0, 8595.0, 23836.0, 89455.0, 703885.0, 155540.0, 35173.0, 11575.0, 5034.0, 2483.0, 1456.0, 811.0, 512.0, 329.0, 226.0, 151.0, 85.0, 52.0, 43.0, 34.0, 17.0, 14.0, 10.0, 4.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.8125, -47.109375, -45.40625, -43.703125, -42.0, -40.296875, -38.59375, -36.890625, -35.1875, -33.484375, -31.78125, -30.078125, -28.375, -26.671875, -24.96875, -23.265625, -21.5625, -19.859375, -18.15625, -16.453125, -14.75, -13.046875, -11.34375, -9.640625, -7.9375, -6.234375, -4.53125, -2.828125, -1.125, 0.578125, 2.28125, 3.984375, 5.6875, 7.390625, 9.09375, 10.796875, 12.5, 14.203125, 15.90625, 17.609375, 19.3125, 21.015625, 22.71875, 24.421875, 26.125, 27.828125, 29.53125, 31.234375, 32.9375, 34.640625, 36.34375, 38.046875, 39.75, 41.453125, 43.15625, 44.859375, 46.5625, 48.265625, 49.96875, 51.671875, 53.375, 55.078125, 56.78125, 58.484375, 60.1875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 14.0, 21.0, 18.0, 33.0, 32.0, 65.0, 102.0, 258.0, 186.0, 77.0, 69.0, 42.0, 13.0, 10.0, 13.0, 10.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002162933349609375, -0.0020969510078430176, -0.00203096866607666, -0.0019649863243103027, -0.0018990039825439453, -0.0018330216407775879, -0.0017670392990112305, -0.001701056957244873, -0.0016350746154785156, -0.0015690922737121582, -0.0015031099319458008, -0.0014371275901794434, -0.001371145248413086, -0.0013051629066467285, -0.001239180564880371, -0.0011731982231140137, -0.0011072158813476562, -0.0010412335395812988, -0.0009752511978149414, -0.000909268856048584, -0.0008432865142822266, -0.0007773041725158691, -0.0007113218307495117, -0.0006453394889831543, -0.0005793571472167969, -0.0005133748054504395, -0.00044739246368408203, -0.0003814101219177246, -0.0003154277801513672, -0.00024944543838500977, -0.00018346309661865234, -0.00011748075485229492, -5.14984130859375e-05, 1.4483928680419922e-05, 8.046627044677734e-05, 0.00014644861221313477, 0.0002124309539794922, 0.0002784132957458496, 0.00034439563751220703, 0.00041037797927856445, 0.0004763603210449219, 0.0005423426628112793, 0.0006083250045776367, 0.0006743073463439941, 0.0007402896881103516, 0.000806272029876709, 0.0008722543716430664, 0.0009382367134094238, 0.0010042190551757812, 0.0010702013969421387, 0.001136183738708496, 0.0012021660804748535, 0.001268148422241211, 0.0013341307640075684, 0.0014001131057739258, 0.0014660954475402832, 0.0015320777893066406, 0.001598060131072998, 0.0016640424728393555, 0.0017300248146057129, 0.0017960071563720703, 0.0018619894981384277, 0.0019279718399047852, 0.0019939541816711426, 0.0020599365234375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 8.0, 13.0, 16.0, 36.0, 49.0, 43.0, 70.0, 108.0, 177.0, 221.0, 313.0, 471.0, 628.0, 1003.0, 1444.0, 2388.0, 3934.0, 7160.0, 15360.0, 42345.0, 215834.0, 646938.0, 66832.0, 21155.0, 9110.0, 4798.0, 2785.0, 1748.0, 1086.0, 727.0, 519.0, 357.0, 240.0, 198.0, 120.0, 79.0, 62.0, 50.0, 40.0, 26.0, 18.0, 7.0, 9.0, 5.0, 10.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.6875, -50.12939453125, -48.5712890625, -47.01318359375, -45.455078125, -43.89697265625, -42.3388671875, -40.78076171875, -39.22265625, -37.66455078125, -36.1064453125, -34.54833984375, -32.990234375, -31.43212890625, -29.8740234375, -28.31591796875, -26.7578125, -25.19970703125, -23.6416015625, -22.08349609375, -20.525390625, -18.96728515625, -17.4091796875, -15.85107421875, -14.29296875, -12.73486328125, -11.1767578125, -9.61865234375, -8.060546875, -6.50244140625, -4.9443359375, -3.38623046875, -1.828125, -0.27001953125, 1.2880859375, 2.84619140625, 4.404296875, 5.96240234375, 7.5205078125, 9.07861328125, 10.63671875, 12.19482421875, 13.7529296875, 15.31103515625, 16.869140625, 18.42724609375, 19.9853515625, 21.54345703125, 23.1015625, 24.65966796875, 26.2177734375, 27.77587890625, 29.333984375, 30.89208984375, 32.4501953125, 34.00830078125, 35.56640625, 37.12451171875, 38.6826171875, 40.24072265625, 41.798828125, 43.35693359375, 44.9150390625, 46.47314453125, 48.03125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 8.0, 3.0, 10.0, 19.0, 16.0, 38.0, 56.0, 61.0, 108.0, 243.0, 126.0, 95.0, 61.0, 39.0, 24.0, 17.0, 13.0, 13.0, 7.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.140625, -12.714111328125, -12.28759765625, -11.861083984375, -11.4345703125, -11.008056640625, -10.58154296875, -10.155029296875, -9.728515625, -9.302001953125, -8.87548828125, -8.448974609375, -8.0224609375, -7.595947265625, -7.16943359375, -6.742919921875, -6.31640625, -5.889892578125, -5.46337890625, -5.036865234375, -4.6103515625, -4.183837890625, -3.75732421875, -3.330810546875, -2.904296875, -2.477783203125, -2.05126953125, -1.624755859375, -1.1982421875, -0.771728515625, -0.34521484375, 0.081298828125, 0.5078125, 0.934326171875, 1.36083984375, 1.787353515625, 2.2138671875, 2.640380859375, 3.06689453125, 3.493408203125, 3.919921875, 4.346435546875, 4.77294921875, 5.199462890625, 5.6259765625, 6.052490234375, 6.47900390625, 6.905517578125, 7.33203125, 7.758544921875, 8.18505859375, 8.611572265625, 9.0380859375, 9.464599609375, 9.89111328125, 10.317626953125, 10.744140625, 11.170654296875, 11.59716796875, 12.023681640625, 12.4501953125, 12.876708984375, 13.30322265625, 13.729736328125, 14.15625]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 4.0, 9.0, 11.0, 12.0, 28.0, 27.0, 37.0, 60.0, 89.0, 137.0, 136.0, 122.0, 67.0, 54.0, 41.0, 29.0, 23.0, 25.0, 13.0, 18.0, 11.0, 8.0, 7.0, 7.0, 4.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.508560180664062, -19.751426696777344, -18.994293212890625, -18.23716163635254, -17.48002815246582, -16.7228946685791, -15.9657621383667, -15.208629608154297, -14.451496124267578, -13.69436264038086, -12.937230110168457, -12.180097579956055, -11.422964096069336, -10.665830612182617, -9.908698081970215, -9.151565551757812, -8.394432067871094, -7.637299060821533, -6.880166053771973, -6.123033046722412, -5.365900039672852, -4.608767032623291, -3.8516340255737305, -3.09450101852417, -2.3373680114746094, -1.5802350044250488, -0.8231019973754883, -0.06596899032592773, 0.6911640167236328, 1.4482970237731934, 2.205430030822754, 2.9625630378723145, 3.719694137573242, 4.476827144622803, 5.233960151672363, 5.991093158721924, 6.748226165771484, 7.505359172821045, 8.262492179870605, 9.019624710083008, 9.776758193969727, 10.533891677856445, 11.291024208068848, 12.04815673828125, 12.805290222167969, 13.562423706054688, 14.31955623626709, 15.076688766479492, 15.833822250366211, 16.59095573425293, 17.348087310791016, 18.105220794677734, 18.862354278564453, 19.619487762451172, 20.37662124633789, 21.133752822875977, 21.890886306762695, 22.648019790649414, 23.4051513671875, 24.16228485107422, 24.919418334960938, 25.676551818847656, 26.433685302734375, 27.19081687927246, 27.94795036315918]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 14.0, 22.0, 23.0, 19.0, 15.0, 18.0, 23.0, 33.0, 19.0, 25.0, 39.0, 34.0, 30.0, 50.0, 28.0, 36.0, 40.0, 31.0, 39.0, 24.0, 42.0, 33.0, 31.0, 36.0, 28.0, 32.0, 25.0, 29.0, 21.0, 16.0, 7.0, 19.0, 7.0, 15.0, 11.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-13.7586030960083, -13.324723243713379, -12.890843391418457, -12.456963539123535, -12.023083686828613, -11.589203834533691, -11.155324935913086, -10.721445083618164, -10.287565231323242, -9.85368537902832, -9.419805526733398, -8.985925674438477, -8.552045822143555, -8.118165969848633, -7.684286594390869, -7.250406742095947, -6.816526412963867, -6.382646560668945, -5.948766708374023, -5.514886856079102, -5.08100700378418, -4.647127151489258, -4.213247776031494, -3.7793679237365723, -3.3454880714416504, -2.9116082191467285, -2.4777283668518066, -2.043848752975464, -1.609968900680542, -1.1760890483856201, -0.7422094345092773, -0.30832958221435547, 0.1255502700805664, 0.5594300627708435, 0.9933098554611206, 1.427189588546753, 1.8610694408416748, 2.2949492931365967, 2.7288289070129395, 3.1627087593078613, 3.596588611602783, 4.030468463897705, 4.464348316192627, 4.898227691650391, 5.3321075439453125, 5.765987396240234, 6.199867248535156, 6.633747100830078, 7.067626953125, 7.501506805419922, 7.935386657714844, 8.369266510009766, 8.803146362304688, 9.23702621459961, 9.670906066894531, 10.104785919189453, 10.538665771484375, 10.972545623779297, 11.406425476074219, 11.84030532836914, 12.274185180664062, 12.708065032958984, 13.141944885253906, 13.575824737548828, 14.009703636169434]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 24.0, 26.0, 40.0, 71.0, 90.0, 131.0, 219.0, 306.0, 454.0, 652.0, 997.0, 1499.0, 2261.0, 3260.0, 4988.0, 7618.0, 12068.0, 18773.0, 30534.0, 52786.0, 97166.0, 221990.0, 832379.0, 1955135.0, 565600.0, 177822.0, 84991.0, 46372.0, 26872.0, 16624.0, 10683.0, 6917.0, 4730.0, 3186.0, 2114.0, 1466.0, 1029.0, 705.0, 521.0, 369.0, 223.0, 171.0, 120.0, 84.0, 67.0, 42.0, 27.0, 24.0, 18.0, 6.0, 9.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0], "bins": [-19.78125, -19.130126953125, -18.47900390625, -17.827880859375, -17.1767578125, -16.525634765625, -15.87451171875, -15.223388671875, -14.572265625, -13.921142578125, -13.27001953125, -12.618896484375, -11.9677734375, -11.316650390625, -10.66552734375, -10.014404296875, -9.36328125, -8.712158203125, -8.06103515625, -7.409912109375, -6.7587890625, -6.107666015625, -5.45654296875, -4.805419921875, -4.154296875, -3.503173828125, -2.85205078125, -2.200927734375, -1.5498046875, -0.898681640625, -0.24755859375, 0.403564453125, 1.0546875, 1.705810546875, 2.35693359375, 3.008056640625, 3.6591796875, 4.310302734375, 4.96142578125, 5.612548828125, 6.263671875, 6.914794921875, 7.56591796875, 8.217041015625, 8.8681640625, 9.519287109375, 10.17041015625, 10.821533203125, 11.47265625, 12.123779296875, 12.77490234375, 13.426025390625, 14.0771484375, 14.728271484375, 15.37939453125, 16.030517578125, 16.681640625, 17.332763671875, 17.98388671875, 18.635009765625, 19.2861328125, 19.937255859375, 20.58837890625, 21.239501953125, 21.890625]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 9.0, 2.0, 7.0, 8.0, 12.0, 17.0, 15.0, 14.0, 22.0, 24.0, 21.0, 21.0, 26.0, 24.0, 33.0, 27.0, 41.0, 38.0, 38.0, 46.0, 31.0, 34.0, 50.0, 38.0, 38.0, 26.0, 30.0, 37.0, 34.0, 32.0, 29.0, 21.0, 24.0, 17.0, 16.0, 14.0, 16.0, 13.0, 7.0, 10.0, 10.0, 7.0, 5.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-8.203125, -7.9493408203125, -7.695556640625, -7.4417724609375, -7.18798828125, -6.9342041015625, -6.680419921875, -6.4266357421875, -6.1728515625, -5.9190673828125, -5.665283203125, -5.4114990234375, -5.15771484375, -4.9039306640625, -4.650146484375, -4.3963623046875, -4.142578125, -3.8887939453125, -3.635009765625, -3.3812255859375, -3.12744140625, -2.8736572265625, -2.619873046875, -2.3660888671875, -2.1123046875, -1.8585205078125, -1.604736328125, -1.3509521484375, -1.09716796875, -0.8433837890625, -0.589599609375, -0.3358154296875, -0.08203125, 0.1717529296875, 0.425537109375, 0.6793212890625, 0.93310546875, 1.1868896484375, 1.440673828125, 1.6944580078125, 1.9482421875, 2.2020263671875, 2.455810546875, 2.7095947265625, 2.96337890625, 3.2171630859375, 3.470947265625, 3.7247314453125, 3.978515625, 4.2322998046875, 4.486083984375, 4.7398681640625, 4.99365234375, 5.2474365234375, 5.501220703125, 5.7550048828125, 6.0087890625, 6.2625732421875, 6.516357421875, 6.7701416015625, 7.02392578125, 7.2777099609375, 7.531494140625, 7.7852783203125, 8.0390625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 7.0, 9.0, 19.0, 38.0, 52.0, 69.0, 71.0, 121.0, 189.0, 302.0, 407.0, 624.0, 901.0, 1410.0, 2213.0, 3425.0, 5283.0, 8743.0, 14149.0, 25214.0, 45581.0, 88765.0, 194801.0, 512679.0, 1826979.0, 905887.0, 290828.0, 124410.0, 60779.0, 32445.0, 18386.0, 10899.0, 6621.0, 4121.0, 2654.0, 1769.0, 1163.0, 747.0, 485.0, 351.0, 207.0, 177.0, 99.0, 68.0, 46.0, 27.0, 24.0, 15.0, 11.0, 9.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.0, -17.4326171875, -16.865234375, -16.2978515625, -15.73046875, -15.1630859375, -14.595703125, -14.0283203125, -13.4609375, -12.8935546875, -12.326171875, -11.7587890625, -11.19140625, -10.6240234375, -10.056640625, -9.4892578125, -8.921875, -8.3544921875, -7.787109375, -7.2197265625, -6.65234375, -6.0849609375, -5.517578125, -4.9501953125, -4.3828125, -3.8154296875, -3.248046875, -2.6806640625, -2.11328125, -1.5458984375, -0.978515625, -0.4111328125, 0.15625, 0.7236328125, 1.291015625, 1.8583984375, 2.42578125, 2.9931640625, 3.560546875, 4.1279296875, 4.6953125, 5.2626953125, 5.830078125, 6.3974609375, 6.96484375, 7.5322265625, 8.099609375, 8.6669921875, 9.234375, 9.8017578125, 10.369140625, 10.9365234375, 11.50390625, 12.0712890625, 12.638671875, 13.2060546875, 13.7734375, 14.3408203125, 14.908203125, 15.4755859375, 16.04296875, 16.6103515625, 17.177734375, 17.7451171875, 18.3125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 4.0, 16.0, 15.0, 16.0, 20.0, 20.0, 28.0, 32.0, 38.0, 57.0, 62.0, 97.0, 114.0, 123.0, 166.0, 193.0, 247.0, 303.0, 353.0, 372.0, 319.0, 293.0, 221.0, 181.0, 161.0, 118.0, 103.0, 83.0, 61.0, 38.0, 42.0, 26.0, 36.0, 22.0, 16.0, 16.0, 5.0, 15.0, 4.0, 9.0, 2.0, 8.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.90234375, -4.747314453125, -4.59228515625, -4.437255859375, -4.2822265625, -4.127197265625, -3.97216796875, -3.817138671875, -3.662109375, -3.507080078125, -3.35205078125, -3.197021484375, -3.0419921875, -2.886962890625, -2.73193359375, -2.576904296875, -2.421875, -2.266845703125, -2.11181640625, -1.956787109375, -1.8017578125, -1.646728515625, -1.49169921875, -1.336669921875, -1.181640625, -1.026611328125, -0.87158203125, -0.716552734375, -0.5615234375, -0.406494140625, -0.25146484375, -0.096435546875, 0.05859375, 0.213623046875, 0.36865234375, 0.523681640625, 0.6787109375, 0.833740234375, 0.98876953125, 1.143798828125, 1.298828125, 1.453857421875, 1.60888671875, 1.763916015625, 1.9189453125, 2.073974609375, 2.22900390625, 2.384033203125, 2.5390625, 2.694091796875, 2.84912109375, 3.004150390625, 3.1591796875, 3.314208984375, 3.46923828125, 3.624267578125, 3.779296875, 3.934326171875, 4.08935546875, 4.244384765625, 4.3994140625, 4.554443359375, 4.70947265625, 4.864501953125, 5.01953125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 9.0, 14.0, 9.0, 18.0, 23.0, 36.0, 59.0, 71.0, 104.0, 177.0, 146.0, 80.0, 59.0, 47.0, 36.0, 27.0, 21.0, 5.0, 12.0, 9.0, 3.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.631935119628906, -19.035533905029297, -18.439132690429688, -17.842729568481445, -17.246328353881836, -16.649927139282227, -16.053525924682617, -15.457124710083008, -14.860722541809082, -14.264321327209473, -13.667919158935547, -13.071517944335938, -12.475116729736328, -11.878714561462402, -11.282313346862793, -10.685911178588867, -10.089509963989258, -9.493108749389648, -8.896706581115723, -8.300305366516113, -7.703903675079346, -7.107501983642578, -6.511100769042969, -5.914699077606201, -5.318297386169434, -4.721895694732666, -4.125494003295898, -3.529092788696289, -2.9326910972595215, -2.336289405822754, -1.7398879528045654, -1.143486499786377, -0.5470848083496094, 0.04931676387786865, 0.6457183361053467, 1.2421199083328247, 1.8385214805603027, 2.4349231719970703, 3.031324625015259, 3.6277260780334473, 4.224127769470215, 4.820529460906982, 5.41693115234375, 6.013332366943359, 6.609734058380127, 7.2061357498168945, 7.802536964416504, 8.39893913269043, 8.995340347290039, 9.591741561889648, 10.188143730163574, 10.784544944763184, 11.38094711303711, 11.977348327636719, 12.573749542236328, 13.170150756835938, 13.766552925109863, 14.362954139709473, 14.959356307983398, 15.555757522583008, 16.152158737182617, 16.74856185913086, 17.34496307373047, 17.941364288330078, 18.537765502929688]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 7.0, 12.0, 16.0, 9.0, 11.0, 12.0, 18.0, 13.0, 19.0, 20.0, 29.0, 28.0, 30.0, 25.0, 25.0, 39.0, 25.0, 35.0, 31.0, 45.0, 24.0, 43.0, 30.0, 45.0, 43.0, 25.0, 22.0, 33.0, 26.0, 34.0, 22.0, 22.0, 36.0, 19.0, 21.0, 10.0, 16.0, 9.0, 9.0, 10.0, 9.0, 6.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.3851900100708, -8.105656623840332, -7.826122283935547, -7.54658842086792, -7.267054557800293, -6.987520694732666, -6.707986831665039, -6.42845344543457, -6.148919105529785, -5.869385242462158, -5.589851379394531, -5.310317516326904, -5.030783653259277, -4.75124979019165, -4.471715927124023, -4.192182540893555, -3.9126486778259277, -3.633114814758301, -3.353580951690674, -3.074047088623047, -2.79451322555542, -2.514979362487793, -2.235445737838745, -1.9559118747711182, -1.6763780117034912, -1.3968441486358643, -1.1173102855682373, -0.8377765417098999, -0.558242678642273, -0.278708815574646, 0.0008249282836914062, 0.28035879135131836, 0.5598926544189453, 0.8394265174865723, 1.1189603805541992, 1.3984941244125366, 1.6780279874801636, 1.9575618505477905, 2.237095594406128, 2.516629457473755, 2.796163320541382, 3.075697183609009, 3.3552310466766357, 3.6347646713256836, 3.9142985343933105, 4.1938323974609375, 4.4733662605285645, 4.752900123596191, 5.032433986663818, 5.311967849731445, 5.591501712799072, 5.871035575866699, 6.150569438934326, 6.430103302001953, 6.709636688232422, 6.989171028137207, 7.268704414367676, 7.548238277435303, 7.82777214050293, 8.107305526733398, 8.386839866638184, 8.666373252868652, 8.945907592773438, 9.225440979003906, 9.504975318908691]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 5.0, 11.0, 13.0, 20.0, 43.0, 67.0, 86.0, 107.0, 186.0, 228.0, 303.0, 524.0, 732.0, 1095.0, 1572.0, 2387.0, 3690.0, 5993.0, 9882.0, 17352.0, 31979.0, 64420.0, 147643.0, 359000.0, 216426.0, 88110.0, 42182.0, 21961.0, 12239.0, 7259.0, 4547.0, 2866.0, 1752.0, 1192.0, 814.0, 508.0, 381.0, 287.0, 183.0, 139.0, 102.0, 55.0, 58.0, 49.0, 31.0, 20.0, 20.0, 11.0, 11.0, 5.0, 4.0, 1.0, 4.0, 1.0], "bins": [-4.609375, -4.47259521484375, -4.3358154296875, -4.19903564453125, -4.062255859375, -3.92547607421875, -3.7886962890625, -3.65191650390625, -3.51513671875, -3.37835693359375, -3.2415771484375, -3.10479736328125, -2.968017578125, -2.83123779296875, -2.6944580078125, -2.55767822265625, -2.4208984375, -2.28411865234375, -2.1473388671875, -2.01055908203125, -1.873779296875, -1.73699951171875, -1.6002197265625, -1.46343994140625, -1.32666015625, -1.18988037109375, -1.0531005859375, -0.91632080078125, -0.779541015625, -0.64276123046875, -0.5059814453125, -0.36920166015625, -0.232421875, -0.09564208984375, 0.0411376953125, 0.17791748046875, 0.314697265625, 0.45147705078125, 0.5882568359375, 0.72503662109375, 0.86181640625, 0.99859619140625, 1.1353759765625, 1.27215576171875, 1.408935546875, 1.54571533203125, 1.6824951171875, 1.81927490234375, 1.9560546875, 2.09283447265625, 2.2296142578125, 2.36639404296875, 2.503173828125, 2.63995361328125, 2.7767333984375, 2.91351318359375, 3.05029296875, 3.18707275390625, 3.3238525390625, 3.46063232421875, 3.597412109375, 3.73419189453125, 3.8709716796875, 4.00775146484375, 4.14453125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 9.0, 11.0, 3.0, 13.0, 16.0, 14.0, 7.0, 18.0, 22.0, 24.0, 28.0, 26.0, 28.0, 30.0, 31.0, 26.0, 34.0, 37.0, 28.0, 38.0, 47.0, 40.0, 46.0, 27.0, 32.0, 35.0, 29.0, 26.0, 28.0, 41.0, 25.0, 18.0, 29.0, 25.0, 17.0, 14.0, 10.0, 10.0, 11.0, 7.0, 11.0, 5.0, 2.0, 8.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.15625, -8.8624267578125, -8.568603515625, -8.2747802734375, -7.98095703125, -7.6871337890625, -7.393310546875, -7.0994873046875, -6.8056640625, -6.5118408203125, -6.218017578125, -5.9241943359375, -5.63037109375, -5.3365478515625, -5.042724609375, -4.7489013671875, -4.455078125, -4.1612548828125, -3.867431640625, -3.5736083984375, -3.27978515625, -2.9859619140625, -2.692138671875, -2.3983154296875, -2.1044921875, -1.8106689453125, -1.516845703125, -1.2230224609375, -0.92919921875, -0.6353759765625, -0.341552734375, -0.0477294921875, 0.24609375, 0.5399169921875, 0.833740234375, 1.1275634765625, 1.42138671875, 1.7152099609375, 2.009033203125, 2.3028564453125, 2.5966796875, 2.8905029296875, 3.184326171875, 3.4781494140625, 3.77197265625, 4.0657958984375, 4.359619140625, 4.6534423828125, 4.947265625, 5.2410888671875, 5.534912109375, 5.8287353515625, 6.12255859375, 6.4163818359375, 6.710205078125, 7.0040283203125, 7.2978515625, 7.5916748046875, 7.885498046875, 8.1793212890625, 8.47314453125, 8.7669677734375, 9.060791015625, 9.3546142578125, 9.6484375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [7.0, 1.0, 3.0, 2.0, 5.0, 9.0, 11.0, 19.0, 14.0, 23.0, 32.0, 62.0, 103.0, 100.0, 147.0, 208.0, 373.0, 427.0, 752.0, 953.0, 1552.0, 2414.0, 3825.0, 6457.0, 11512.0, 22034.0, 47457.0, 122062.0, 445017.0, 237636.0, 74188.0, 32485.0, 16149.0, 8562.0, 5028.0, 3143.0, 1931.0, 1265.0, 796.0, 580.0, 346.0, 248.0, 181.0, 155.0, 74.0, 56.0, 43.0, 31.0, 26.0, 20.0, 15.0, 12.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.28515625, -5.10137939453125, -4.9176025390625, -4.73382568359375, -4.550048828125, -4.36627197265625, -4.1824951171875, -3.99871826171875, -3.81494140625, -3.63116455078125, -3.4473876953125, -3.26361083984375, -3.079833984375, -2.89605712890625, -2.7122802734375, -2.52850341796875, -2.3447265625, -2.16094970703125, -1.9771728515625, -1.79339599609375, -1.609619140625, -1.42584228515625, -1.2420654296875, -1.05828857421875, -0.87451171875, -0.69073486328125, -0.5069580078125, -0.32318115234375, -0.139404296875, 0.04437255859375, 0.2281494140625, 0.41192626953125, 0.595703125, 0.77947998046875, 0.9632568359375, 1.14703369140625, 1.330810546875, 1.51458740234375, 1.6983642578125, 1.88214111328125, 2.06591796875, 2.24969482421875, 2.4334716796875, 2.61724853515625, 2.801025390625, 2.98480224609375, 3.1685791015625, 3.35235595703125, 3.5361328125, 3.71990966796875, 3.9036865234375, 4.08746337890625, 4.271240234375, 4.45501708984375, 4.6387939453125, 4.82257080078125, 5.00634765625, 5.19012451171875, 5.3739013671875, 5.55767822265625, 5.741455078125, 5.92523193359375, 6.1090087890625, 6.29278564453125, 6.4765625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 9.0, 3.0, 7.0, 13.0, 8.0, 14.0, 13.0, 12.0, 17.0, 19.0, 26.0, 29.0, 36.0, 33.0, 41.0, 53.0, 45.0, 44.0, 47.0, 42.0, 33.0, 40.0, 37.0, 43.0, 47.0, 39.0, 29.0, 30.0, 29.0, 37.0, 28.0, 13.0, 10.0, 13.0, 10.0, 16.0, 9.0, 7.0, 6.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.62109375, -6.39678955078125, -6.1724853515625, -5.94818115234375, -5.723876953125, -5.49957275390625, -5.2752685546875, -5.05096435546875, -4.82666015625, -4.60235595703125, -4.3780517578125, -4.15374755859375, -3.929443359375, -3.70513916015625, -3.4808349609375, -3.25653076171875, -3.0322265625, -2.80792236328125, -2.5836181640625, -2.35931396484375, -2.135009765625, -1.91070556640625, -1.6864013671875, -1.46209716796875, -1.23779296875, -1.01348876953125, -0.7891845703125, -0.56488037109375, -0.340576171875, -0.11627197265625, 0.1080322265625, 0.33233642578125, 0.556640625, 0.78094482421875, 1.0052490234375, 1.22955322265625, 1.453857421875, 1.67816162109375, 1.9024658203125, 2.12677001953125, 2.35107421875, 2.57537841796875, 2.7996826171875, 3.02398681640625, 3.248291015625, 3.47259521484375, 3.6968994140625, 3.92120361328125, 4.1455078125, 4.36981201171875, 4.5941162109375, 4.81842041015625, 5.042724609375, 5.26702880859375, 5.4913330078125, 5.71563720703125, 5.93994140625, 6.16424560546875, 6.3885498046875, 6.61285400390625, 6.837158203125, 7.06146240234375, 7.2857666015625, 7.51007080078125, 7.734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 11.0, 7.0, 17.0, 15.0, 22.0, 29.0, 36.0, 70.0, 67.0, 94.0, 142.0, 245.0, 323.0, 464.0, 662.0, 1079.0, 1549.0, 2442.0, 3958.0, 6802.0, 11849.0, 22814.0, 47633.0, 119263.0, 503841.0, 191951.0, 66238.0, 30010.0, 15005.0, 8372.0, 4888.0, 3024.0, 1832.0, 1203.0, 788.0, 550.0, 361.0, 241.0, 162.0, 145.0, 86.0, 73.0, 55.0, 37.0, 22.0, 18.0, 16.0, 9.0, 7.0, 8.0, 8.0, 4.0, 3.0], "bins": [-1.3447265625, -1.3070526123046875, -1.269378662109375, -1.2317047119140625, -1.19403076171875, -1.1563568115234375, -1.118682861328125, -1.0810089111328125, -1.0433349609375, -1.0056610107421875, -0.967987060546875, -0.9303131103515625, -0.89263916015625, -0.8549652099609375, -0.817291259765625, -0.7796173095703125, -0.741943359375, -0.7042694091796875, -0.666595458984375, -0.6289215087890625, -0.59124755859375, -0.5535736083984375, -0.515899658203125, -0.4782257080078125, -0.4405517578125, -0.4028778076171875, -0.365203857421875, -0.3275299072265625, -0.28985595703125, -0.2521820068359375, -0.214508056640625, -0.1768341064453125, -0.13916015625, -0.1014862060546875, -0.063812255859375, -0.0261383056640625, 0.01153564453125, 0.0492095947265625, 0.086883544921875, 0.1245574951171875, 0.1622314453125, 0.1999053955078125, 0.237579345703125, 0.2752532958984375, 0.31292724609375, 0.3506011962890625, 0.388275146484375, 0.4259490966796875, 0.463623046875, 0.5012969970703125, 0.538970947265625, 0.5766448974609375, 0.61431884765625, 0.6519927978515625, 0.689666748046875, 0.7273406982421875, 0.7650146484375, 0.8026885986328125, 0.840362548828125, 0.8780364990234375, 0.91571044921875, 0.9533843994140625, 0.991058349609375, 1.0287322998046875, 1.06640625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 9.0, 14.0, 22.0, 24.0, 31.0, 43.0, 66.0, 91.0, 125.0, 158.0, 112.0, 93.0, 59.0, 42.0, 25.0, 19.0, 20.0, 6.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010883808135986328, -0.00010486319661140442, -0.00010088831186294556, -9.69134271144867e-05, -9.293854236602783e-05, -8.896365761756897e-05, -8.498877286911011e-05, -8.101388812065125e-05, -7.703900337219238e-05, -7.306411862373352e-05, -6.908923387527466e-05, -6.51143491268158e-05, -6.113946437835693e-05, -5.716457962989807e-05, -5.318969488143921e-05, -4.921481013298035e-05, -4.5239925384521484e-05, -4.126504063606262e-05, -3.729015588760376e-05, -3.33152711391449e-05, -2.9340386390686035e-05, -2.5365501642227173e-05, -2.139061689376831e-05, -1.7415732145309448e-05, -1.3440847396850586e-05, -9.465962648391724e-06, -5.491077899932861e-06, -1.516193151473999e-06, 2.4586915969848633e-06, 6.433576345443726e-06, 1.0408461093902588e-05, 1.438334584236145e-05, 1.8358230590820312e-05, 2.2333115339279175e-05, 2.6308000087738037e-05, 3.02828848361969e-05, 3.425776958465576e-05, 3.8232654333114624e-05, 4.2207539081573486e-05, 4.618242383003235e-05, 5.015730857849121e-05, 5.413219332695007e-05, 5.8107078075408936e-05, 6.20819628238678e-05, 6.605684757232666e-05, 7.003173232078552e-05, 7.400661706924438e-05, 7.798150181770325e-05, 8.195638656616211e-05, 8.593127131462097e-05, 8.990615606307983e-05, 9.38810408115387e-05, 9.785592555999756e-05, 0.00010183081030845642, 0.00010580569505691528, 0.00010978057980537415, 0.00011375546455383301, 0.00011773034930229187, 0.00012170523405075073, 0.0001256801187992096, 0.00012965500354766846, 0.00013362988829612732, 0.00013760477304458618, 0.00014157965779304504, 0.0001455545425415039]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 6.0, 4.0, 9.0, 16.0, 21.0, 30.0, 47.0, 52.0, 80.0, 113.0, 190.0, 221.0, 349.0, 513.0, 707.0, 1074.0, 1455.0, 2284.0, 3457.0, 5209.0, 8250.0, 13390.0, 22713.0, 40173.0, 79156.0, 212170.0, 424412.0, 108134.0, 51364.0, 28245.0, 16384.0, 9769.0, 6317.0, 4042.0, 2546.0, 1817.0, 1105.0, 753.0, 607.0, 443.0, 274.0, 197.0, 153.0, 90.0, 63.0, 48.0, 30.0, 21.0, 18.0, 17.0, 6.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.193359375, -2.11822509765625, -2.0430908203125, -1.96795654296875, -1.892822265625, -1.81768798828125, -1.7425537109375, -1.66741943359375, -1.59228515625, -1.51715087890625, -1.4420166015625, -1.36688232421875, -1.291748046875, -1.21661376953125, -1.1414794921875, -1.06634521484375, -0.9912109375, -0.91607666015625, -0.8409423828125, -0.76580810546875, -0.690673828125, -0.61553955078125, -0.5404052734375, -0.46527099609375, -0.39013671875, -0.31500244140625, -0.2398681640625, -0.16473388671875, -0.089599609375, -0.01446533203125, 0.0606689453125, 0.13580322265625, 0.2109375, 0.28607177734375, 0.3612060546875, 0.43634033203125, 0.511474609375, 0.58660888671875, 0.6617431640625, 0.73687744140625, 0.81201171875, 0.88714599609375, 0.9622802734375, 1.03741455078125, 1.112548828125, 1.18768310546875, 1.2628173828125, 1.33795166015625, 1.4130859375, 1.48822021484375, 1.5633544921875, 1.63848876953125, 1.713623046875, 1.78875732421875, 1.8638916015625, 1.93902587890625, 2.01416015625, 2.08929443359375, 2.1644287109375, 2.23956298828125, 2.314697265625, 2.38983154296875, 2.4649658203125, 2.54010009765625, 2.615234375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 7.0, 6.0, 5.0, 8.0, 5.0, 8.0, 12.0, 9.0, 22.0, 21.0, 23.0, 19.0, 34.0, 33.0, 27.0, 41.0, 47.0, 70.0, 73.0, 82.0, 65.0, 62.0, 50.0, 32.0, 31.0, 27.0, 23.0, 33.0, 16.0, 15.0, 20.0, 13.0, 12.0, 9.0, 6.0, 7.0, 4.0, 3.0, 1.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.73291015625, -0.71209716796875, -0.6912841796875, -0.67047119140625, -0.649658203125, -0.62884521484375, -0.6080322265625, -0.58721923828125, -0.56640625, -0.54559326171875, -0.5247802734375, -0.50396728515625, -0.483154296875, -0.46234130859375, -0.4415283203125, -0.42071533203125, -0.39990234375, -0.37908935546875, -0.3582763671875, -0.33746337890625, -0.316650390625, -0.29583740234375, -0.2750244140625, -0.25421142578125, -0.2333984375, -0.21258544921875, -0.1917724609375, -0.17095947265625, -0.150146484375, -0.12933349609375, -0.1085205078125, -0.08770751953125, -0.06689453125, -0.04608154296875, -0.0252685546875, -0.00445556640625, 0.016357421875, 0.03717041015625, 0.0579833984375, 0.07879638671875, 0.099609375, 0.12042236328125, 0.1412353515625, 0.16204833984375, 0.182861328125, 0.20367431640625, 0.2244873046875, 0.24530029296875, 0.26611328125, 0.28692626953125, 0.3077392578125, 0.32855224609375, 0.349365234375, 0.37017822265625, 0.3909912109375, 0.41180419921875, 0.4326171875, 0.45343017578125, 0.4742431640625, 0.49505615234375, 0.515869140625, 0.53668212890625, 0.5574951171875, 0.57830810546875, 0.59912109375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 8.0, 6.0, 16.0, 6.0, 12.0, 23.0, 31.0, 43.0, 71.0, 90.0, 150.0, 172.0, 100.0, 74.0, 50.0, 35.0, 30.0, 20.0, 14.0, 14.0, 8.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.981359481811523, -19.361576080322266, -18.74179458618164, -18.122011184692383, -17.502227783203125, -16.882444381713867, -16.26266098022461, -15.642879486083984, -15.023096084594727, -14.403312683105469, -13.783530235290527, -13.163747787475586, -12.543964385986328, -11.92418098449707, -11.304398536682129, -10.684616088867188, -10.06483268737793, -9.445049285888672, -8.82526683807373, -8.205484390258789, -7.585700988769531, -6.965918064117432, -6.346135139465332, -5.726352214813232, -5.106569290161133, -4.486786365509033, -3.8670034408569336, -3.247220516204834, -2.6274375915527344, -2.0076546669006348, -1.3878717422485352, -0.7680888175964355, -0.14830780029296875, 0.47147512435913086, 1.0912580490112305, 1.71104097366333, 2.3308238983154297, 2.9506068229675293, 3.570389747619629, 4.1901726722717285, 4.809955596923828, 5.429738521575928, 6.049521446228027, 6.669304370880127, 7.289087295532227, 7.908870220184326, 8.528653144836426, 9.148435592651367, 9.768218994140625, 10.388002395629883, 11.007784843444824, 11.627567291259766, 12.247350692749023, 12.867134094238281, 13.486916542053223, 14.106698989868164, 14.726482391357422, 15.34626579284668, 15.966048240661621, 16.585830688476562, 17.20561408996582, 17.825397491455078, 18.445178985595703, 19.06496238708496, 19.68474578857422]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 12.0, 12.0, 10.0, 13.0, 12.0, 17.0, 17.0, 20.0, 20.0, 22.0, 32.0, 29.0, 30.0, 30.0, 34.0, 30.0, 25.0, 41.0, 36.0, 35.0, 40.0, 34.0, 36.0, 41.0, 24.0, 38.0, 29.0, 28.0, 26.0, 24.0, 30.0, 20.0, 28.0, 17.0, 12.0, 11.0, 10.0, 11.0, 9.0, 6.0, 9.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.137797355651855, -8.844019889831543, -8.55024242401123, -8.256464958190918, -7.9626874923706055, -7.668910026550293, -7.3751325607299805, -7.081355094909668, -6.7875776290893555, -6.493800163269043, -6.2000226974487305, -5.906245231628418, -5.6124677658081055, -5.318690299987793, -5.0249128341674805, -4.731135368347168, -4.437357425689697, -4.143579959869385, -3.8498024940490723, -3.5560250282287598, -3.2622475624084473, -2.9684700965881348, -2.674692392349243, -2.3809149265289307, -2.087137460708618, -1.7933599948883057, -1.4995825290679932, -1.2058049440383911, -0.9120274782180786, -0.6182500123977661, -0.32447242736816406, -0.030694961547851562, 0.26308250427246094, 0.5568599700927734, 0.8506374955177307, 1.144415020942688, 1.4381924867630005, 1.731969952583313, 2.025747537612915, 2.3195250034332275, 2.61330246925354, 2.9070799350738525, 3.200857400894165, 3.4946351051330566, 3.788412570953369, 4.082190036773682, 4.375967502593994, 4.669744968414307, 4.963522434234619, 5.257299900054932, 5.551077365875244, 5.844854831695557, 6.138632297515869, 6.432409763336182, 6.726187705993652, 7.019965171813965, 7.313742637634277, 7.60752010345459, 7.901297569274902, 8.195075035095215, 8.488852500915527, 8.78262996673584, 9.076407432556152, 9.370184898376465, 9.663962364196777]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 7.0, 9.0, 9.0, 17.0, 28.0, 43.0, 38.0, 78.0, 103.0, 129.0, 209.0, 348.0, 543.0, 769.0, 1240.0, 1854.0, 2938.0, 4771.0, 7743.0, 12611.0, 21578.0, 36733.0, 64082.0, 113851.0, 204651.0, 240512.0, 142780.0, 78983.0, 45223.0, 26117.0, 15662.0, 9371.0, 5730.0, 3507.0, 2230.0, 1398.0, 946.0, 609.0, 380.0, 224.0, 175.0, 94.0, 58.0, 56.0, 36.0, 25.0, 17.0, 17.0, 9.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-14.5546875, -14.0880126953125, -13.621337890625, -13.1546630859375, -12.68798828125, -12.2213134765625, -11.754638671875, -11.2879638671875, -10.8212890625, -10.3546142578125, -9.887939453125, -9.4212646484375, -8.95458984375, -8.4879150390625, -8.021240234375, -7.5545654296875, -7.087890625, -6.6212158203125, -6.154541015625, -5.6878662109375, -5.22119140625, -4.7545166015625, -4.287841796875, -3.8211669921875, -3.3544921875, -2.8878173828125, -2.421142578125, -1.9544677734375, -1.48779296875, -1.0211181640625, -0.554443359375, -0.0877685546875, 0.37890625, 0.8455810546875, 1.312255859375, 1.7789306640625, 2.24560546875, 2.7122802734375, 3.178955078125, 3.6456298828125, 4.1123046875, 4.5789794921875, 5.045654296875, 5.5123291015625, 5.97900390625, 6.4456787109375, 6.912353515625, 7.3790283203125, 7.845703125, 8.3123779296875, 8.779052734375, 9.2457275390625, 9.71240234375, 10.1790771484375, 10.645751953125, 11.1124267578125, 11.5791015625, 12.0457763671875, 12.512451171875, 12.9791259765625, 13.44580078125, 13.9124755859375, 14.379150390625, 14.8458251953125, 15.3125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 5.0, 9.0, 13.0, 6.0, 16.0, 14.0, 11.0, 18.0, 16.0, 21.0, 25.0, 32.0, 28.0, 45.0, 40.0, 23.0, 29.0, 39.0, 46.0, 30.0, 30.0, 44.0, 40.0, 35.0, 33.0, 36.0, 33.0, 34.0, 31.0, 26.0, 25.0, 22.0, 25.0, 18.0, 21.0, 11.0, 7.0, 6.0, 11.0, 9.0, 6.0, 4.0, 8.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.4375, -8.153076171875, -7.86865234375, -7.584228515625, -7.2998046875, -7.015380859375, -6.73095703125, -6.446533203125, -6.162109375, -5.877685546875, -5.59326171875, -5.308837890625, -5.0244140625, -4.739990234375, -4.45556640625, -4.171142578125, -3.88671875, -3.602294921875, -3.31787109375, -3.033447265625, -2.7490234375, -2.464599609375, -2.18017578125, -1.895751953125, -1.611328125, -1.326904296875, -1.04248046875, -0.758056640625, -0.4736328125, -0.189208984375, 0.09521484375, 0.379638671875, 0.6640625, 0.948486328125, 1.23291015625, 1.517333984375, 1.8017578125, 2.086181640625, 2.37060546875, 2.655029296875, 2.939453125, 3.223876953125, 3.50830078125, 3.792724609375, 4.0771484375, 4.361572265625, 4.64599609375, 4.930419921875, 5.21484375, 5.499267578125, 5.78369140625, 6.068115234375, 6.3525390625, 6.636962890625, 6.92138671875, 7.205810546875, 7.490234375, 7.774658203125, 8.05908203125, 8.343505859375, 8.6279296875, 8.912353515625, 9.19677734375, 9.481201171875, 9.765625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 7.0, 5.0, 12.0, 15.0, 22.0, 16.0, 39.0, 61.0, 83.0, 133.0, 154.0, 263.0, 378.0, 573.0, 910.0, 1433.0, 2267.0, 3729.0, 6125.0, 10359.0, 18087.0, 31966.0, 57475.0, 106626.0, 207591.0, 272323.0, 148455.0, 78358.0, 42812.0, 24009.0, 13499.0, 8041.0, 4750.0, 2852.0, 1809.0, 1144.0, 709.0, 509.0, 299.0, 208.0, 134.0, 91.0, 72.0, 41.0, 38.0, 22.0, 21.0, 10.0, 7.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-16.078125, -15.57958984375, -15.0810546875, -14.58251953125, -14.083984375, -13.58544921875, -13.0869140625, -12.58837890625, -12.08984375, -11.59130859375, -11.0927734375, -10.59423828125, -10.095703125, -9.59716796875, -9.0986328125, -8.60009765625, -8.1015625, -7.60302734375, -7.1044921875, -6.60595703125, -6.107421875, -5.60888671875, -5.1103515625, -4.61181640625, -4.11328125, -3.61474609375, -3.1162109375, -2.61767578125, -2.119140625, -1.62060546875, -1.1220703125, -0.62353515625, -0.125, 0.37353515625, 0.8720703125, 1.37060546875, 1.869140625, 2.36767578125, 2.8662109375, 3.36474609375, 3.86328125, 4.36181640625, 4.8603515625, 5.35888671875, 5.857421875, 6.35595703125, 6.8544921875, 7.35302734375, 7.8515625, 8.35009765625, 8.8486328125, 9.34716796875, 9.845703125, 10.34423828125, 10.8427734375, 11.34130859375, 11.83984375, 12.33837890625, 12.8369140625, 13.33544921875, 13.833984375, 14.33251953125, 14.8310546875, 15.32958984375, 15.828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 1.0, 9.0, 3.0, 3.0, 19.0, 14.0, 22.0, 23.0, 23.0, 17.0, 20.0, 41.0, 37.0, 37.0, 32.0, 35.0, 51.0, 44.0, 53.0, 32.0, 48.0, 39.0, 47.0, 43.0, 43.0, 35.0, 40.0, 21.0, 32.0, 34.0, 21.0, 11.0, 14.0, 9.0, 10.0, 7.0, 10.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6875, -7.46142578125, -7.2353515625, -7.00927734375, -6.783203125, -6.55712890625, -6.3310546875, -6.10498046875, -5.87890625, -5.65283203125, -5.4267578125, -5.20068359375, -4.974609375, -4.74853515625, -4.5224609375, -4.29638671875, -4.0703125, -3.84423828125, -3.6181640625, -3.39208984375, -3.166015625, -2.93994140625, -2.7138671875, -2.48779296875, -2.26171875, -2.03564453125, -1.8095703125, -1.58349609375, -1.357421875, -1.13134765625, -0.9052734375, -0.67919921875, -0.453125, -0.22705078125, -0.0009765625, 0.22509765625, 0.451171875, 0.67724609375, 0.9033203125, 1.12939453125, 1.35546875, 1.58154296875, 1.8076171875, 2.03369140625, 2.259765625, 2.48583984375, 2.7119140625, 2.93798828125, 3.1640625, 3.39013671875, 3.6162109375, 3.84228515625, 4.068359375, 4.29443359375, 4.5205078125, 4.74658203125, 4.97265625, 5.19873046875, 5.4248046875, 5.65087890625, 5.876953125, 6.10302734375, 6.3291015625, 6.55517578125, 6.78125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 2.0, 7.0, 4.0, 18.0, 11.0, 32.0, 30.0, 38.0, 78.0, 102.0, 180.0, 261.0, 406.0, 683.0, 1081.0, 1735.0, 3242.0, 5965.0, 12039.0, 28278.0, 83558.0, 560769.0, 250119.0, 57439.0, 21379.0, 9558.0, 4860.0, 2609.0, 1609.0, 875.0, 577.0, 339.0, 203.0, 143.0, 96.0, 77.0, 49.0, 30.0, 24.0, 14.0, 12.0, 9.0, 4.0, 8.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.859375, -27.980712890625, -27.10205078125, -26.223388671875, -25.3447265625, -24.466064453125, -23.58740234375, -22.708740234375, -21.830078125, -20.951416015625, -20.07275390625, -19.194091796875, -18.3154296875, -17.436767578125, -16.55810546875, -15.679443359375, -14.80078125, -13.922119140625, -13.04345703125, -12.164794921875, -11.2861328125, -10.407470703125, -9.52880859375, -8.650146484375, -7.771484375, -6.892822265625, -6.01416015625, -5.135498046875, -4.2568359375, -3.378173828125, -2.49951171875, -1.620849609375, -0.7421875, 0.136474609375, 1.01513671875, 1.893798828125, 2.7724609375, 3.651123046875, 4.52978515625, 5.408447265625, 6.287109375, 7.165771484375, 8.04443359375, 8.923095703125, 9.8017578125, 10.680419921875, 11.55908203125, 12.437744140625, 13.31640625, 14.195068359375, 15.07373046875, 15.952392578125, 16.8310546875, 17.709716796875, 18.58837890625, 19.467041015625, 20.345703125, 21.224365234375, 22.10302734375, 22.981689453125, 23.8603515625, 24.739013671875, 25.61767578125, 26.496337890625, 27.375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 7.0, 9.0, 10.0, 13.0, 19.0, 29.0, 54.0, 63.0, 140.0, 267.0, 137.0, 104.0, 48.0, 32.0, 23.0, 15.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012044906616210938, -0.0011591315269470215, -0.0011137723922729492, -0.001068413257598877, -0.0010230541229248047, -0.0009776949882507324, -0.0009323358535766602, -0.0008869767189025879, -0.0008416175842285156, -0.0007962584495544434, -0.0007508993148803711, -0.0007055401802062988, -0.0006601810455322266, -0.0006148219108581543, -0.000569462776184082, -0.0005241036415100098, -0.0004787445068359375, -0.00043338537216186523, -0.00038802623748779297, -0.0003426671028137207, -0.00029730796813964844, -0.00025194883346557617, -0.0002065896987915039, -0.00016123056411743164, -0.00011587142944335938, -7.051229476928711e-05, -2.5153160095214844e-05, 2.0205974578857422e-05, 6.556510925292969e-05, 0.00011092424392700195, 0.00015628337860107422, 0.00020164251327514648, 0.00024700164794921875, 0.000292360782623291, 0.0003377199172973633, 0.00038307905197143555, 0.0004284381866455078, 0.0004737973213195801, 0.0005191564559936523, 0.0005645155906677246, 0.0006098747253417969, 0.0006552338600158691, 0.0007005929946899414, 0.0007459521293640137, 0.0007913112640380859, 0.0008366703987121582, 0.0008820295333862305, 0.0009273886680603027, 0.000972747802734375, 0.0010181069374084473, 0.0010634660720825195, 0.0011088252067565918, 0.001154184341430664, 0.0011995434761047363, 0.0012449026107788086, 0.0012902617454528809, 0.0013356208801269531, 0.0013809800148010254, 0.0014263391494750977, 0.00147169828414917, 0.0015170574188232422, 0.0015624165534973145, 0.0016077756881713867, 0.001653134822845459, 0.0016984939575195312]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 11.0, 12.0, 15.0, 19.0, 23.0, 25.0, 40.0, 50.0, 83.0, 106.0, 135.0, 199.0, 244.0, 378.0, 518.0, 750.0, 1073.0, 1740.0, 2812.0, 4931.0, 9063.0, 19052.0, 46922.0, 170319.0, 613782.0, 107336.0, 35011.0, 14980.0, 7510.0, 4096.0, 2484.0, 1528.0, 1008.0, 655.0, 467.0, 315.0, 227.0, 169.0, 119.0, 92.0, 55.0, 42.0, 46.0, 33.0, 20.0, 14.0, 12.0, 7.0, 7.0, 11.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0], "bins": [-27.09375, -26.2294921875, -25.365234375, -24.5009765625, -23.63671875, -22.7724609375, -21.908203125, -21.0439453125, -20.1796875, -19.3154296875, -18.451171875, -17.5869140625, -16.72265625, -15.8583984375, -14.994140625, -14.1298828125, -13.265625, -12.4013671875, -11.537109375, -10.6728515625, -9.80859375, -8.9443359375, -8.080078125, -7.2158203125, -6.3515625, -5.4873046875, -4.623046875, -3.7587890625, -2.89453125, -2.0302734375, -1.166015625, -0.3017578125, 0.5625, 1.4267578125, 2.291015625, 3.1552734375, 4.01953125, 4.8837890625, 5.748046875, 6.6123046875, 7.4765625, 8.3408203125, 9.205078125, 10.0693359375, 10.93359375, 11.7978515625, 12.662109375, 13.5263671875, 14.390625, 15.2548828125, 16.119140625, 16.9833984375, 17.84765625, 18.7119140625, 19.576171875, 20.4404296875, 21.3046875, 22.1689453125, 23.033203125, 23.8974609375, 24.76171875, 25.6259765625, 26.490234375, 27.3544921875, 28.21875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 11.0, 11.0, 17.0, 14.0, 33.0, 38.0, 48.0, 81.0, 86.0, 165.0, 105.0, 108.0, 66.0, 54.0, 41.0, 24.0, 24.0, 16.0, 6.0, 10.0, 5.0, 8.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.328125, -8.07440185546875, -7.8206787109375, -7.56695556640625, -7.313232421875, -7.05950927734375, -6.8057861328125, -6.55206298828125, -6.29833984375, -6.04461669921875, -5.7908935546875, -5.53717041015625, -5.283447265625, -5.02972412109375, -4.7760009765625, -4.52227783203125, -4.2685546875, -4.01483154296875, -3.7611083984375, -3.50738525390625, -3.253662109375, -2.99993896484375, -2.7462158203125, -2.49249267578125, -2.23876953125, -1.98504638671875, -1.7313232421875, -1.47760009765625, -1.223876953125, -0.97015380859375, -0.7164306640625, -0.46270751953125, -0.208984375, 0.04473876953125, 0.2984619140625, 0.55218505859375, 0.805908203125, 1.05963134765625, 1.3133544921875, 1.56707763671875, 1.82080078125, 2.07452392578125, 2.3282470703125, 2.58197021484375, 2.835693359375, 3.08941650390625, 3.3431396484375, 3.59686279296875, 3.8505859375, 4.10430908203125, 4.3580322265625, 4.61175537109375, 4.865478515625, 5.11920166015625, 5.3729248046875, 5.62664794921875, 5.88037109375, 6.13409423828125, 6.3878173828125, 6.64154052734375, 6.895263671875, 7.14898681640625, 7.4027099609375, 7.65643310546875, 7.91015625]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 10.0, 10.0, 6.0, 17.0, 18.0, 23.0, 33.0, 54.0, 75.0, 104.0, 147.0, 129.0, 86.0, 60.0, 47.0, 40.0, 24.0, 25.0, 14.0, 13.0, 9.0, 6.0, 9.0, 4.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.894287109375, -14.371912002563477, -13.849535942077637, -13.327160835266113, -12.804784774780273, -12.28240966796875, -11.760034561157227, -11.237659454345703, -10.715283393859863, -10.19290828704834, -9.6705322265625, -9.148157119750977, -8.625782012939453, -8.103405952453613, -7.58103084564209, -7.058655261993408, -6.536279678344727, -6.013904094696045, -5.491528511047363, -4.96915340423584, -4.446777820587158, -3.9244022369384766, -3.402026891708374, -2.8796515464782715, -2.35727596282959, -1.8349004983901978, -1.3125250339508057, -0.7901495695114136, -0.2677741050720215, 0.25460147857666016, 0.7769768238067627, 1.2993521690368652, 1.8217277526855469, 2.3441033363342285, 2.866478681564331, 3.3888540267944336, 3.9112296104431152, 4.433605194091797, 4.95598030090332, 5.478355884552002, 6.000731468200684, 6.523107051849365, 7.045482635498047, 7.56785774230957, 8.090232849121094, 8.612608909606934, 9.134984016418457, 9.657360076904297, 10.17973518371582, 10.702110290527344, 11.224486351013184, 11.746861457824707, 12.269237518310547, 12.79161262512207, 13.313987731933594, 13.836362838745117, 14.358738899230957, 14.88111400604248, 15.40349006652832, 15.925865173339844, 16.448240280151367, 16.97061538696289, 17.492992401123047, 18.01536750793457, 18.537742614746094]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 4.0, 6.0, 7.0, 8.0, 11.0, 10.0, 16.0, 21.0, 20.0, 28.0, 25.0, 27.0, 26.0, 21.0, 29.0, 25.0, 43.0, 40.0, 35.0, 38.0, 46.0, 31.0, 36.0, 33.0, 37.0, 39.0, 33.0, 23.0, 27.0, 26.0, 29.0, 20.0, 26.0, 21.0, 22.0, 16.0, 6.0, 13.0, 13.0, 9.0, 7.0, 6.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-10.119451522827148, -9.8136568069458, -9.507862091064453, -9.202068328857422, -8.896273612976074, -8.590478897094727, -8.284684181213379, -7.978889465332031, -7.673095226287842, -7.367300510406494, -7.061506271362305, -6.755711555480957, -6.449916839599609, -6.14412260055542, -5.838327884674072, -5.532533645629883, -5.226738929748535, -4.9209442138671875, -4.615149974822998, -4.30935525894165, -4.003561019897461, -3.6977663040161133, -3.3919715881347656, -3.086177110671997, -2.7803826332092285, -2.47458815574646, -2.1687936782836914, -1.8629989624023438, -1.5572044849395752, -1.2514100074768066, -0.9456154108047485, -0.6398208141326904, -0.3340263366699219, -0.028231799602508545, 0.2775627374649048, 0.5833572745323181, 0.8891518115997314, 1.1949462890625, 1.500740885734558, 1.8065354824066162, 2.1123299598693848, 2.4181244373321533, 2.723918914794922, 3.0297136306762695, 3.335508108139038, 3.6413025856018066, 3.9470973014831543, 4.252891540527344, 4.558686256408691, 4.864480972290039, 5.1702752113342285, 5.476069927215576, 5.781864166259766, 6.087658882141113, 6.393453598022461, 6.699248313903809, 7.005042552947998, 7.310837268829346, 7.616631507873535, 7.922426223754883, 8.22822093963623, 8.534015655517578, 8.83980941772461, 9.145604133605957, 9.451398849487305]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 5.0, 16.0, 23.0, 38.0, 44.0, 78.0, 111.0, 166.0, 250.0, 355.0, 631.0, 931.0, 1293.0, 1968.0, 2836.0, 4220.0, 6391.0, 9734.0, 14848.0, 23515.0, 38929.0, 67272.0, 125078.0, 297728.0, 1153989.0, 1675292.0, 417180.0, 155265.0, 77772.0, 43497.0, 25663.0, 16035.0, 10353.0, 6923.0, 4751.0, 3252.0, 2323.0, 1638.0, 1143.0, 784.0, 588.0, 416.0, 280.0, 192.0, 153.0, 104.0, 76.0, 58.0, 29.0, 23.0, 15.0, 13.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.4140625, -11.9730224609375, -11.531982421875, -11.0909423828125, -10.64990234375, -10.2088623046875, -9.767822265625, -9.3267822265625, -8.8857421875, -8.4447021484375, -8.003662109375, -7.5626220703125, -7.12158203125, -6.6805419921875, -6.239501953125, -5.7984619140625, -5.357421875, -4.9163818359375, -4.475341796875, -4.0343017578125, -3.59326171875, -3.1522216796875, -2.711181640625, -2.2701416015625, -1.8291015625, -1.3880615234375, -0.947021484375, -0.5059814453125, -0.06494140625, 0.3760986328125, 0.817138671875, 1.2581787109375, 1.69921875, 2.1402587890625, 2.581298828125, 3.0223388671875, 3.46337890625, 3.9044189453125, 4.345458984375, 4.7864990234375, 5.2275390625, 5.6685791015625, 6.109619140625, 6.5506591796875, 6.99169921875, 7.4327392578125, 7.873779296875, 8.3148193359375, 8.755859375, 9.1968994140625, 9.637939453125, 10.0789794921875, 10.52001953125, 10.9610595703125, 11.402099609375, 11.8431396484375, 12.2841796875, 12.7252197265625, 13.166259765625, 13.6072998046875, 14.04833984375, 14.4893798828125, 14.930419921875, 15.3714599609375, 15.8125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 7.0, 6.0, 7.0, 11.0, 11.0, 17.0, 23.0, 19.0, 15.0, 18.0, 21.0, 24.0, 34.0, 29.0, 30.0, 25.0, 27.0, 37.0, 38.0, 32.0, 39.0, 43.0, 44.0, 36.0, 40.0, 39.0, 19.0, 21.0, 36.0, 28.0, 29.0, 27.0, 30.0, 23.0, 18.0, 8.0, 11.0, 11.0, 9.0, 8.0, 6.0, 3.0, 2.0, 4.0, 5.0, 11.0, 7.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.8984375, -5.72509765625, -5.5517578125, -5.37841796875, -5.205078125, -5.03173828125, -4.8583984375, -4.68505859375, -4.51171875, -4.33837890625, -4.1650390625, -3.99169921875, -3.818359375, -3.64501953125, -3.4716796875, -3.29833984375, -3.125, -2.95166015625, -2.7783203125, -2.60498046875, -2.431640625, -2.25830078125, -2.0849609375, -1.91162109375, -1.73828125, -1.56494140625, -1.3916015625, -1.21826171875, -1.044921875, -0.87158203125, -0.6982421875, -0.52490234375, -0.3515625, -0.17822265625, -0.0048828125, 0.16845703125, 0.341796875, 0.51513671875, 0.6884765625, 0.86181640625, 1.03515625, 1.20849609375, 1.3818359375, 1.55517578125, 1.728515625, 1.90185546875, 2.0751953125, 2.24853515625, 2.421875, 2.59521484375, 2.7685546875, 2.94189453125, 3.115234375, 3.28857421875, 3.4619140625, 3.63525390625, 3.80859375, 3.98193359375, 4.1552734375, 4.32861328125, 4.501953125, 4.67529296875, 4.8486328125, 5.02197265625, 5.1953125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 10.0, 14.0, 25.0, 32.0, 39.0, 65.0, 99.0, 154.0, 229.0, 365.0, 507.0, 821.0, 1222.0, 1832.0, 2966.0, 4724.0, 7820.0, 13282.0, 23529.0, 43900.0, 88976.0, 200257.0, 559886.0, 1942588.0, 812854.0, 258231.0, 109839.0, 52629.0, 27685.0, 15545.0, 9261.0, 5401.0, 3403.0, 2102.0, 1385.0, 893.0, 575.0, 370.0, 249.0, 179.0, 109.0, 71.0, 58.0, 30.0, 23.0, 16.0, 10.0, 13.0, 6.0, 4.0, 2.0, 3.0], "bins": [-15.4921875, -15.0574951171875, -14.622802734375, -14.1881103515625, -13.75341796875, -13.3187255859375, -12.884033203125, -12.4493408203125, -12.0146484375, -11.5799560546875, -11.145263671875, -10.7105712890625, -10.27587890625, -9.8411865234375, -9.406494140625, -8.9718017578125, -8.537109375, -8.1024169921875, -7.667724609375, -7.2330322265625, -6.79833984375, -6.3636474609375, -5.928955078125, -5.4942626953125, -5.0595703125, -4.6248779296875, -4.190185546875, -3.7554931640625, -3.32080078125, -2.8861083984375, -2.451416015625, -2.0167236328125, -1.58203125, -1.1473388671875, -0.712646484375, -0.2779541015625, 0.15673828125, 0.5914306640625, 1.026123046875, 1.4608154296875, 1.8955078125, 2.3302001953125, 2.764892578125, 3.1995849609375, 3.63427734375, 4.0689697265625, 4.503662109375, 4.9383544921875, 5.373046875, 5.8077392578125, 6.242431640625, 6.6771240234375, 7.11181640625, 7.5465087890625, 7.981201171875, 8.4158935546875, 8.8505859375, 9.2852783203125, 9.719970703125, 10.1546630859375, 10.58935546875, 11.0240478515625, 11.458740234375, 11.8934326171875, 12.328125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 6.0, 3.0, 13.0, 11.0, 12.0, 23.0, 23.0, 27.0, 40.0, 66.0, 60.0, 78.0, 113.0, 133.0, 151.0, 208.0, 291.0, 306.0, 377.0, 400.0, 351.0, 278.0, 223.0, 181.0, 160.0, 117.0, 86.0, 75.0, 58.0, 51.0, 35.0, 23.0, 21.0, 19.0, 9.0, 11.0, 8.0, 11.0, 4.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.537109375, -3.412567138671875, -3.28802490234375, -3.163482666015625, -3.0389404296875, -2.914398193359375, -2.78985595703125, -2.665313720703125, -2.540771484375, -2.416229248046875, -2.29168701171875, -2.167144775390625, -2.0426025390625, -1.918060302734375, -1.79351806640625, -1.668975830078125, -1.54443359375, -1.419891357421875, -1.29534912109375, -1.170806884765625, -1.0462646484375, -0.921722412109375, -0.79718017578125, -0.672637939453125, -0.548095703125, -0.423553466796875, -0.29901123046875, -0.174468994140625, -0.0499267578125, 0.074615478515625, 0.19915771484375, 0.323699951171875, 0.4482421875, 0.572784423828125, 0.69732666015625, 0.821868896484375, 0.9464111328125, 1.070953369140625, 1.19549560546875, 1.320037841796875, 1.444580078125, 1.569122314453125, 1.69366455078125, 1.818206787109375, 1.9427490234375, 2.067291259765625, 2.19183349609375, 2.316375732421875, 2.44091796875, 2.565460205078125, 2.69000244140625, 2.814544677734375, 2.9390869140625, 3.063629150390625, 3.18817138671875, 3.312713623046875, 3.437255859375, 3.561798095703125, 3.68634033203125, 3.810882568359375, 3.9354248046875, 4.059967041015625, 4.18450927734375, 4.309051513671875, 4.43359375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 8.0, 9.0, 14.0, 19.0, 17.0, 40.0, 47.0, 65.0, 121.0, 190.0, 161.0, 98.0, 65.0, 39.0, 28.0, 19.0, 10.0, 14.0, 9.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.638710975646973, -13.131742477416992, -12.624774932861328, -12.117807388305664, -11.610838890075684, -11.103870391845703, -10.596902847290039, -10.089935302734375, -9.582966804504395, -9.075998306274414, -8.56903076171875, -8.062063217163086, -7.5550947189331055, -7.048126697540283, -6.541158676147461, -6.034190654754639, -5.527222633361816, -5.020254611968994, -4.513286590576172, -4.00631856918335, -3.4993505477905273, -2.992382526397705, -2.485414505004883, -1.9784464836120605, -1.4714784622192383, -0.964510440826416, -0.45754241943359375, 0.049425601959228516, 0.5563936233520508, 1.063361644744873, 1.5703296661376953, 2.0772976875305176, 2.5842647552490234, 3.0912327766418457, 3.598200798034668, 4.10516881942749, 4.6121368408203125, 5.119104862213135, 5.626072883605957, 6.133040904998779, 6.640008926391602, 7.146976947784424, 7.653944969177246, 8.160913467407227, 8.66788101196289, 9.174848556518555, 9.681817054748535, 10.188785552978516, 10.69575309753418, 11.202720642089844, 11.709689140319824, 12.216657638549805, 12.723625183105469, 13.230592727661133, 13.737561225891113, 14.244529724121094, 14.751497268676758, 15.258464813232422, 15.765433311462402, 16.272401809692383, 16.779369354248047, 17.28633689880371, 17.793304443359375, 18.300273895263672, 18.807241439819336]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 0.0, 5.0, 9.0, 8.0, 3.0, 8.0, 9.0, 16.0, 19.0, 20.0, 15.0, 20.0, 29.0, 33.0, 32.0, 37.0, 33.0, 31.0, 33.0, 35.0, 52.0, 36.0, 37.0, 41.0, 27.0, 31.0, 27.0, 35.0, 35.0, 28.0, 36.0, 36.0, 30.0, 23.0, 17.0, 15.0, 20.0, 19.0, 8.0, 10.0, 9.0, 11.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.555624485015869, -6.339968681335449, -6.124312877655029, -5.908657073974609, -5.6930012702941895, -5.4773454666137695, -5.261690139770508, -5.04603385925293, -4.830378532409668, -4.614722728729248, -4.399066925048828, -4.183411121368408, -3.9677553176879883, -3.7520995140075684, -3.5364439487457275, -3.3207881450653076, -3.1051321029663086, -2.8894762992858887, -2.6738204956054688, -2.458164691925049, -2.242508888244629, -2.026853084564209, -1.8111975193023682, -1.5955417156219482, -1.3798859119415283, -1.1642301082611084, -0.9485743641853333, -0.7329186201095581, -0.5172628164291382, -0.30160701274871826, -0.08595132827758789, 0.12970447540283203, 0.34535980224609375, 0.5610156059265137, 0.7766713500022888, 0.992327094078064, 1.2079828977584839, 1.4236387014389038, 1.6392943859100342, 1.854950189590454, 2.070605993270874, 2.286261796951294, 2.501917600631714, 2.7175731658935547, 2.9332289695739746, 3.1488847732543945, 3.3645405769348145, 3.5801963806152344, 3.7958521842956543, 4.011507987976074, 4.227163791656494, 4.442819595336914, 4.658475399017334, 4.874131202697754, 5.089786529541016, 5.305442810058594, 5.5210981369018555, 5.736753940582275, 5.952409744262695, 6.168065547943115, 6.383721351623535, 6.599377155303955, 6.815032958984375, 7.030688285827637, 7.246344566345215]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 8.0, 21.0, 31.0, 37.0, 44.0, 65.0, 96.0, 167.0, 232.0, 343.0, 537.0, 844.0, 1330.0, 2373.0, 3942.0, 6931.0, 13523.0, 27368.0, 62315.0, 169479.0, 447946.0, 183917.0, 66131.0, 29007.0, 13893.0, 7465.0, 4080.0, 2421.0, 1417.0, 937.0, 572.0, 324.0, 224.0, 165.0, 121.0, 77.0, 53.0, 31.0, 25.0, 16.0, 8.0, 12.0, 12.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.39453125, -4.26348876953125, -4.1324462890625, -4.00140380859375, -3.870361328125, -3.73931884765625, -3.6082763671875, -3.47723388671875, -3.34619140625, -3.21514892578125, -3.0841064453125, -2.95306396484375, -2.822021484375, -2.69097900390625, -2.5599365234375, -2.42889404296875, -2.2978515625, -2.16680908203125, -2.0357666015625, -1.90472412109375, -1.773681640625, -1.64263916015625, -1.5115966796875, -1.38055419921875, -1.24951171875, -1.11846923828125, -0.9874267578125, -0.85638427734375, -0.725341796875, -0.59429931640625, -0.4632568359375, -0.33221435546875, -0.201171875, -0.07012939453125, 0.0609130859375, 0.19195556640625, 0.322998046875, 0.45404052734375, 0.5850830078125, 0.71612548828125, 0.84716796875, 0.97821044921875, 1.1092529296875, 1.24029541015625, 1.371337890625, 1.50238037109375, 1.6334228515625, 1.76446533203125, 1.8955078125, 2.02655029296875, 2.1575927734375, 2.28863525390625, 2.419677734375, 2.55072021484375, 2.6817626953125, 2.81280517578125, 2.94384765625, 3.07489013671875, 3.2059326171875, 3.33697509765625, 3.468017578125, 3.59906005859375, 3.7301025390625, 3.86114501953125, 3.9921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 13.0, 7.0, 9.0, 16.0, 20.0, 17.0, 16.0, 20.0, 31.0, 45.0, 31.0, 31.0, 44.0, 41.0, 41.0, 54.0, 46.0, 31.0, 47.0, 38.0, 36.0, 37.0, 37.0, 35.0, 36.0, 33.0, 34.0, 20.0, 20.0, 24.0, 16.0, 9.0, 11.0, 10.0, 9.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7421875, -7.4951171875, -7.248046875, -7.0009765625, -6.75390625, -6.5068359375, -6.259765625, -6.0126953125, -5.765625, -5.5185546875, -5.271484375, -5.0244140625, -4.77734375, -4.5302734375, -4.283203125, -4.0361328125, -3.7890625, -3.5419921875, -3.294921875, -3.0478515625, -2.80078125, -2.5537109375, -2.306640625, -2.0595703125, -1.8125, -1.5654296875, -1.318359375, -1.0712890625, -0.82421875, -0.5771484375, -0.330078125, -0.0830078125, 0.1640625, 0.4111328125, 0.658203125, 0.9052734375, 1.15234375, 1.3994140625, 1.646484375, 1.8935546875, 2.140625, 2.3876953125, 2.634765625, 2.8818359375, 3.12890625, 3.3759765625, 3.623046875, 3.8701171875, 4.1171875, 4.3642578125, 4.611328125, 4.8583984375, 5.10546875, 5.3525390625, 5.599609375, 5.8466796875, 6.09375, 6.3408203125, 6.587890625, 6.8349609375, 7.08203125, 7.3291015625, 7.576171875, 7.8232421875, 8.0703125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 8.0, 4.0, 0.0, 10.0, 8.0, 11.0, 24.0, 9.0, 22.0, 49.0, 67.0, 93.0, 111.0, 169.0, 291.0, 357.0, 597.0, 842.0, 1301.0, 2173.0, 3651.0, 6427.0, 12104.0, 25892.0, 64685.0, 237366.0, 500918.0, 113622.0, 39151.0, 17381.0, 8660.0, 4819.0, 2772.0, 1648.0, 1172.0, 669.0, 448.0, 328.0, 208.0, 153.0, 102.0, 58.0, 48.0, 45.0, 33.0, 17.0, 15.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.046875, -5.87530517578125, -5.7037353515625, -5.53216552734375, -5.360595703125, -5.18902587890625, -5.0174560546875, -4.84588623046875, -4.67431640625, -4.50274658203125, -4.3311767578125, -4.15960693359375, -3.988037109375, -3.81646728515625, -3.6448974609375, -3.47332763671875, -3.3017578125, -3.13018798828125, -2.9586181640625, -2.78704833984375, -2.615478515625, -2.44390869140625, -2.2723388671875, -2.10076904296875, -1.92919921875, -1.75762939453125, -1.5860595703125, -1.41448974609375, -1.242919921875, -1.07135009765625, -0.8997802734375, -0.72821044921875, -0.556640625, -0.38507080078125, -0.2135009765625, -0.04193115234375, 0.129638671875, 0.30120849609375, 0.4727783203125, 0.64434814453125, 0.81591796875, 0.98748779296875, 1.1590576171875, 1.33062744140625, 1.502197265625, 1.67376708984375, 1.8453369140625, 2.01690673828125, 2.1884765625, 2.36004638671875, 2.5316162109375, 2.70318603515625, 2.874755859375, 3.04632568359375, 3.2178955078125, 3.38946533203125, 3.56103515625, 3.73260498046875, 3.9041748046875, 4.07574462890625, 4.247314453125, 4.41888427734375, 4.5904541015625, 4.76202392578125, 4.93359375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 13.0, 6.0, 7.0, 11.0, 22.0, 16.0, 25.0, 35.0, 14.0, 30.0, 23.0, 32.0, 47.0, 44.0, 43.0, 35.0, 40.0, 51.0, 32.0, 37.0, 29.0, 36.0, 35.0, 43.0, 30.0, 23.0, 20.0, 38.0, 27.0, 22.0, 19.0, 24.0, 16.0, 13.0, 7.0, 9.0, 5.0, 6.0, 7.0, 7.0, 8.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.953125, -4.79644775390625, -4.6397705078125, -4.48309326171875, -4.326416015625, -4.16973876953125, -4.0130615234375, -3.85638427734375, -3.69970703125, -3.54302978515625, -3.3863525390625, -3.22967529296875, -3.072998046875, -2.91632080078125, -2.7596435546875, -2.60296630859375, -2.4462890625, -2.28961181640625, -2.1329345703125, -1.97625732421875, -1.819580078125, -1.66290283203125, -1.5062255859375, -1.34954833984375, -1.19287109375, -1.03619384765625, -0.8795166015625, -0.72283935546875, -0.566162109375, -0.40948486328125, -0.2528076171875, -0.09613037109375, 0.060546875, 0.21722412109375, 0.3739013671875, 0.53057861328125, 0.687255859375, 0.84393310546875, 1.0006103515625, 1.15728759765625, 1.31396484375, 1.47064208984375, 1.6273193359375, 1.78399658203125, 1.940673828125, 2.09735107421875, 2.2540283203125, 2.41070556640625, 2.5673828125, 2.72406005859375, 2.8807373046875, 3.03741455078125, 3.194091796875, 3.35076904296875, 3.5074462890625, 3.66412353515625, 3.82080078125, 3.97747802734375, 4.1341552734375, 4.29083251953125, 4.447509765625, 4.60418701171875, 4.7608642578125, 4.91754150390625, 5.07421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 7.0, 13.0, 21.0, 31.0, 47.0, 62.0, 92.0, 138.0, 176.0, 267.0, 374.0, 546.0, 836.0, 1117.0, 1790.0, 2793.0, 4545.0, 7781.0, 13475.0, 26008.0, 57832.0, 178591.0, 540191.0, 117774.0, 44203.0, 20794.0, 11263.0, 6590.0, 3940.0, 2385.0, 1576.0, 1047.0, 707.0, 473.0, 299.0, 223.0, 155.0, 103.0, 70.0, 59.0, 39.0, 30.0, 23.0, 25.0, 12.0, 13.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.78125, -0.7570953369140625, -0.732940673828125, -0.7087860107421875, -0.68463134765625, -0.6604766845703125, -0.636322021484375, -0.6121673583984375, -0.5880126953125, -0.5638580322265625, -0.539703369140625, -0.5155487060546875, -0.49139404296875, -0.4672393798828125, -0.443084716796875, -0.4189300537109375, -0.394775390625, -0.3706207275390625, -0.346466064453125, -0.3223114013671875, -0.29815673828125, -0.2740020751953125, -0.249847412109375, -0.2256927490234375, -0.2015380859375, -0.1773834228515625, -0.153228759765625, -0.1290740966796875, -0.10491943359375, -0.0807647705078125, -0.056610107421875, -0.0324554443359375, -0.00830078125, 0.0158538818359375, 0.040008544921875, 0.0641632080078125, 0.08831787109375, 0.1124725341796875, 0.136627197265625, 0.1607818603515625, 0.1849365234375, 0.2090911865234375, 0.233245849609375, 0.2574005126953125, 0.28155517578125, 0.3057098388671875, 0.329864501953125, 0.3540191650390625, 0.378173828125, 0.4023284912109375, 0.426483154296875, 0.4506378173828125, 0.47479248046875, 0.4989471435546875, 0.523101806640625, 0.5472564697265625, 0.5714111328125, 0.5955657958984375, 0.619720458984375, 0.6438751220703125, 0.66802978515625, 0.6921844482421875, 0.716339111328125, 0.7404937744140625, 0.7646484375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 9.0, 7.0, 19.0, 17.0, 15.0, 33.0, 31.0, 36.0, 61.0, 102.0, 178.0, 148.0, 110.0, 57.0, 49.0, 27.0, 22.0, 12.0, 15.0, 4.0, 7.0, 7.0, 6.0, 2.0, 5.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.43865966796875e-05, -7.212255150079727e-05, -6.985850632190704e-05, -6.759446114301682e-05, -6.533041596412659e-05, -6.306637078523636e-05, -6.080232560634613e-05, -5.85382804274559e-05, -5.6274235248565674e-05, -5.4010190069675446e-05, -5.174614489078522e-05, -4.948209971189499e-05, -4.721805453300476e-05, -4.495400935411453e-05, -4.2689964175224304e-05, -4.0425918996334076e-05, -3.816187381744385e-05, -3.589782863855362e-05, -3.363378345966339e-05, -3.136973828077316e-05, -2.9105693101882935e-05, -2.6841647922992706e-05, -2.4577602744102478e-05, -2.231355756521225e-05, -2.004951238632202e-05, -1.7785467207431793e-05, -1.5521422028541565e-05, -1.3257376849651337e-05, -1.0993331670761108e-05, -8.72928649187088e-06, -6.465241312980652e-06, -4.201196134090424e-06, -1.9371509552001953e-06, 3.2689422369003296e-07, 2.5909394025802612e-06, 4.8549845814704895e-06, 7.119029760360718e-06, 9.383074939250946e-06, 1.1647120118141174e-05, 1.3911165297031403e-05, 1.617521047592163e-05, 1.843925565481186e-05, 2.0703300833702087e-05, 2.2967346012592316e-05, 2.5231391191482544e-05, 2.7495436370372772e-05, 2.9759481549263e-05, 3.202352672815323e-05, 3.428757190704346e-05, 3.6551617085933685e-05, 3.8815662264823914e-05, 4.107970744371414e-05, 4.334375262260437e-05, 4.56077978014946e-05, 4.787184298038483e-05, 5.0135888159275055e-05, 5.239993333816528e-05, 5.466397851705551e-05, 5.692802369594574e-05, 5.919206887483597e-05, 6.14561140537262e-05, 6.372015923261642e-05, 6.598420441150665e-05, 6.824824959039688e-05, 7.051229476928711e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 10.0, 12.0, 20.0, 25.0, 34.0, 61.0, 72.0, 114.0, 168.0, 219.0, 278.0, 383.0, 552.0, 789.0, 1144.0, 1656.0, 2416.0, 3729.0, 5607.0, 8524.0, 14067.0, 23581.0, 41394.0, 79249.0, 210545.0, 422498.0, 104817.0, 51434.0, 28379.0, 16659.0, 10147.0, 6464.0, 4296.0, 2934.0, 1833.0, 1335.0, 920.0, 652.0, 437.0, 340.0, 236.0, 167.0, 105.0, 73.0, 62.0, 35.0, 21.0, 16.0, 15.0, 11.0, 9.0, 1.0, 6.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.2548828125, -1.21588134765625, -1.1768798828125, -1.13787841796875, -1.098876953125, -1.05987548828125, -1.0208740234375, -0.98187255859375, -0.94287109375, -0.90386962890625, -0.8648681640625, -0.82586669921875, -0.786865234375, -0.74786376953125, -0.7088623046875, -0.66986083984375, -0.630859375, -0.59185791015625, -0.5528564453125, -0.51385498046875, -0.474853515625, -0.43585205078125, -0.3968505859375, -0.35784912109375, -0.31884765625, -0.27984619140625, -0.2408447265625, -0.20184326171875, -0.162841796875, -0.12384033203125, -0.0848388671875, -0.04583740234375, -0.0068359375, 0.03216552734375, 0.0711669921875, 0.11016845703125, 0.149169921875, 0.18817138671875, 0.2271728515625, 0.26617431640625, 0.30517578125, 0.34417724609375, 0.3831787109375, 0.42218017578125, 0.461181640625, 0.50018310546875, 0.5391845703125, 0.57818603515625, 0.6171875, 0.65618896484375, 0.6951904296875, 0.73419189453125, 0.773193359375, 0.81219482421875, 0.8511962890625, 0.89019775390625, 0.92919921875, 0.96820068359375, 1.0072021484375, 1.04620361328125, 1.085205078125, 1.12420654296875, 1.1632080078125, 1.20220947265625, 1.2412109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 6.0, 2.0, 4.0, 4.0, 8.0, 16.0, 12.0, 14.0, 23.0, 15.0, 24.0, 28.0, 35.0, 21.0, 38.0, 37.0, 40.0, 46.0, 74.0, 97.0, 61.0, 51.0, 44.0, 36.0, 44.0, 41.0, 31.0, 27.0, 19.0, 9.0, 16.0, 9.0, 8.0, 17.0, 4.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3525390625, -0.3416175842285156, -0.33069610595703125, -0.3197746276855469, -0.3088531494140625, -0.2979316711425781, -0.28701019287109375, -0.2760887145996094, -0.265167236328125, -0.2542457580566406, -0.24332427978515625, -0.23240280151367188, -0.2214813232421875, -0.21055984497070312, -0.19963836669921875, -0.18871688842773438, -0.17779541015625, -0.16687393188476562, -0.15595245361328125, -0.14503097534179688, -0.1341094970703125, -0.12318801879882812, -0.11226654052734375, -0.10134506225585938, -0.090423583984375, -0.07950210571289062, -0.06858062744140625, -0.057659149169921875, -0.0467376708984375, -0.035816192626953125, -0.02489471435546875, -0.013973236083984375, -0.0030517578125, 0.007869720458984375, 0.01879119873046875, 0.029712677001953125, 0.0406341552734375, 0.051555633544921875, 0.06247711181640625, 0.07339859008789062, 0.084320068359375, 0.09524154663085938, 0.10616302490234375, 0.11708450317382812, 0.1280059814453125, 0.13892745971679688, 0.14984893798828125, 0.16077041625976562, 0.17169189453125, 0.18261337280273438, 0.19353485107421875, 0.20445632934570312, 0.2153778076171875, 0.22629928588867188, 0.23722076416015625, 0.24814224243164062, 0.259063720703125, 0.2699851989746094, 0.28090667724609375, 0.2918281555175781, 0.3027496337890625, 0.3136711120605469, 0.32459259033203125, 0.3355140686035156, 0.346435546875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 10.0, 8.0, 12.0, 16.0, 21.0, 31.0, 50.0, 55.0, 117.0, 172.0, 187.0, 105.0, 62.0, 42.0, 29.0, 21.0, 14.0, 14.0, 7.0, 8.0, 4.0, 1.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.326739311218262, -12.813835144042969, -12.300930976867676, -11.788026809692383, -11.27512264251709, -10.762218475341797, -10.249314308166504, -9.736410140991211, -9.223505973815918, -8.710601806640625, -8.197697639465332, -7.684793472290039, -7.171889305114746, -6.658985137939453, -6.14608097076416, -5.633176803588867, -5.120272636413574, -4.607368469238281, -4.094464302062988, -3.5815601348876953, -3.0686559677124023, -2.5557518005371094, -2.0428476333618164, -1.5299434661865234, -1.0170392990112305, -0.5041351318359375, 0.008769035339355469, 0.5216732025146484, 1.0345773696899414, 1.5474815368652344, 2.0603857040405273, 2.5732898712158203, 3.0861949920654297, 3.5990991592407227, 4.112003326416016, 4.624907493591309, 5.137811660766602, 5.6507158279418945, 6.1636199951171875, 6.6765241622924805, 7.189428329467773, 7.702332496643066, 8.21523666381836, 8.728140830993652, 9.241044998168945, 9.753949165344238, 10.266853332519531, 10.779757499694824, 11.292661666870117, 11.80556583404541, 12.318470001220703, 12.831374168395996, 13.344278335571289, 13.857182502746582, 14.370086669921875, 14.882990837097168, 15.395895004272461, 15.908799171447754, 16.421703338623047, 16.934608459472656, 17.447511672973633, 17.96041488647461, 18.47332000732422, 18.986225128173828, 19.499128341674805]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 8.0, 6.0, 8.0, 8.0, 9.0, 17.0, 14.0, 22.0, 17.0, 24.0, 36.0, 24.0, 32.0, 34.0, 36.0, 32.0, 39.0, 34.0, 39.0, 53.0, 39.0, 24.0, 30.0, 34.0, 31.0, 34.0, 34.0, 35.0, 26.0, 35.0, 30.0, 22.0, 17.0, 19.0, 18.0, 13.0, 11.0, 8.0, 11.0, 9.0, 3.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.646876811981201, -6.427663803100586, -6.208450794219971, -5.9892377853393555, -5.770024299621582, -5.550811290740967, -5.331598281860352, -5.112385272979736, -4.893172264099121, -4.673959255218506, -4.454746246337891, -4.235532760620117, -4.016319751739502, -3.7971067428588867, -3.5778937339782715, -3.3586807250976562, -3.139467239379883, -2.9202542304992676, -2.7010409832000732, -2.481827974319458, -2.2626147270202637, -2.0434017181396484, -1.8241887092590332, -1.6049755811691284, -1.3857624530792236, -1.1665493249893188, -0.9473362565040588, -0.7281231880187988, -0.508910059928894, -0.28969693183898926, -0.07048392295837402, 0.14872920513153076, 0.36794281005859375, 0.5871559381484985, 0.8063690066337585, 1.0255820751190186, 1.2447952032089233, 1.4640083312988281, 1.6832213401794434, 1.9024344682693481, 2.121647596359253, 2.340860605239868, 2.5600738525390625, 2.7792868614196777, 2.998499870300293, 3.2177131175994873, 3.4369261264801025, 3.656139373779297, 3.875352382659912, 4.094565391540527, 4.313778400421143, 4.532991409301758, 4.752204895019531, 4.9714179039001465, 5.190630912780762, 5.409843921661377, 5.629056930541992, 5.848269939422607, 6.067482948303223, 6.286696434020996, 6.505909442901611, 6.725122451782227, 6.944335460662842, 7.163548469543457, 7.3827619552612305]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 12.0, 11.0, 12.0, 36.0, 49.0, 56.0, 88.0, 136.0, 197.0, 281.0, 461.0, 602.0, 954.0, 1299.0, 1999.0, 2940.0, 4602.0, 7456.0, 11767.0, 19823.0, 34051.0, 61146.0, 114422.0, 222861.0, 256319.0, 135444.0, 71435.0, 39577.0, 22985.0, 13668.0, 8236.0, 5284.0, 3440.0, 2177.0, 1445.0, 1033.0, 685.0, 461.0, 338.0, 232.0, 169.0, 114.0, 78.0, 66.0, 31.0, 24.0, 17.0, 12.0, 10.0, 6.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.625, -11.2515869140625, -10.878173828125, -10.5047607421875, -10.13134765625, -9.7579345703125, -9.384521484375, -9.0111083984375, -8.6376953125, -8.2642822265625, -7.890869140625, -7.5174560546875, -7.14404296875, -6.7706298828125, -6.397216796875, -6.0238037109375, -5.650390625, -5.2769775390625, -4.903564453125, -4.5301513671875, -4.15673828125, -3.7833251953125, -3.409912109375, -3.0364990234375, -2.6630859375, -2.2896728515625, -1.916259765625, -1.5428466796875, -1.16943359375, -0.7960205078125, -0.422607421875, -0.0491943359375, 0.32421875, 0.6976318359375, 1.071044921875, 1.4444580078125, 1.81787109375, 2.1912841796875, 2.564697265625, 2.9381103515625, 3.3115234375, 3.6849365234375, 4.058349609375, 4.4317626953125, 4.80517578125, 5.1785888671875, 5.552001953125, 5.9254150390625, 6.298828125, 6.6722412109375, 7.045654296875, 7.4190673828125, 7.79248046875, 8.1658935546875, 8.539306640625, 8.9127197265625, 9.2861328125, 9.6595458984375, 10.032958984375, 10.4063720703125, 10.77978515625, 11.1531982421875, 11.526611328125, 11.9000244140625, 12.2734375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 0.0, 4.0, 7.0, 10.0, 10.0, 6.0, 5.0, 12.0, 13.0, 15.0, 17.0, 26.0, 30.0, 33.0, 31.0, 32.0, 35.0, 39.0, 39.0, 44.0, 44.0, 48.0, 38.0, 27.0, 40.0, 38.0, 29.0, 30.0, 35.0, 31.0, 39.0, 32.0, 32.0, 28.0, 16.0, 14.0, 16.0, 10.0, 8.0, 7.0, 9.0, 6.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.7274169921875, -5.525146484375, -5.3228759765625, -5.12060546875, -4.9183349609375, -4.716064453125, -4.5137939453125, -4.3115234375, -4.1092529296875, -3.906982421875, -3.7047119140625, -3.50244140625, -3.3001708984375, -3.097900390625, -2.8956298828125, -2.693359375, -2.4910888671875, -2.288818359375, -2.0865478515625, -1.88427734375, -1.6820068359375, -1.479736328125, -1.2774658203125, -1.0751953125, -0.8729248046875, -0.670654296875, -0.4683837890625, -0.26611328125, -0.0638427734375, 0.138427734375, 0.3406982421875, 0.54296875, 0.7452392578125, 0.947509765625, 1.1497802734375, 1.35205078125, 1.5543212890625, 1.756591796875, 1.9588623046875, 2.1611328125, 2.3634033203125, 2.565673828125, 2.7679443359375, 2.97021484375, 3.1724853515625, 3.374755859375, 3.5770263671875, 3.779296875, 3.9815673828125, 4.183837890625, 4.3861083984375, 4.58837890625, 4.7906494140625, 4.992919921875, 5.1951904296875, 5.3974609375, 5.5997314453125, 5.802001953125, 6.0042724609375, 6.20654296875, 6.4088134765625, 6.611083984375, 6.8133544921875, 7.015625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 10.0, 13.0, 14.0, 21.0, 26.0, 46.0, 58.0, 85.0, 121.0, 192.0, 291.0, 412.0, 630.0, 946.0, 1601.0, 2585.0, 4023.0, 6770.0, 11231.0, 19221.0, 33134.0, 57280.0, 103004.0, 191708.0, 258292.0, 156162.0, 84442.0, 47512.0, 27910.0, 16147.0, 9556.0, 5680.0, 3371.0, 2107.0, 1326.0, 898.0, 553.0, 383.0, 243.0, 168.0, 118.0, 83.0, 50.0, 43.0, 28.0, 18.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0], "bins": [-12.0625, -11.711181640625, -11.35986328125, -11.008544921875, -10.6572265625, -10.305908203125, -9.95458984375, -9.603271484375, -9.251953125, -8.900634765625, -8.54931640625, -8.197998046875, -7.8466796875, -7.495361328125, -7.14404296875, -6.792724609375, -6.44140625, -6.090087890625, -5.73876953125, -5.387451171875, -5.0361328125, -4.684814453125, -4.33349609375, -3.982177734375, -3.630859375, -3.279541015625, -2.92822265625, -2.576904296875, -2.2255859375, -1.874267578125, -1.52294921875, -1.171630859375, -0.8203125, -0.468994140625, -0.11767578125, 0.233642578125, 0.5849609375, 0.936279296875, 1.28759765625, 1.638916015625, 1.990234375, 2.341552734375, 2.69287109375, 3.044189453125, 3.3955078125, 3.746826171875, 4.09814453125, 4.449462890625, 4.80078125, 5.152099609375, 5.50341796875, 5.854736328125, 6.2060546875, 6.557373046875, 6.90869140625, 7.260009765625, 7.611328125, 7.962646484375, 8.31396484375, 8.665283203125, 9.0166015625, 9.367919921875, 9.71923828125, 10.070556640625, 10.421875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 6.0, 14.0, 11.0, 14.0, 13.0, 16.0, 18.0, 24.0, 17.0, 21.0, 21.0, 28.0, 29.0, 20.0, 30.0, 44.0, 37.0, 43.0, 35.0, 48.0, 27.0, 33.0, 43.0, 34.0, 36.0, 38.0, 31.0, 26.0, 35.0, 22.0, 19.0, 23.0, 24.0, 12.0, 20.0, 13.0, 15.0, 11.0, 7.0, 5.0, 6.0, 5.0, 4.0, 1.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.736328125, -3.613494873046875, -3.49066162109375, -3.367828369140625, -3.2449951171875, -3.122161865234375, -2.99932861328125, -2.876495361328125, -2.753662109375, -2.630828857421875, -2.50799560546875, -2.385162353515625, -2.2623291015625, -2.139495849609375, -2.01666259765625, -1.893829345703125, -1.77099609375, -1.648162841796875, -1.52532958984375, -1.402496337890625, -1.2796630859375, -1.156829833984375, -1.03399658203125, -0.911163330078125, -0.788330078125, -0.665496826171875, -0.54266357421875, -0.419830322265625, -0.2969970703125, -0.174163818359375, -0.05133056640625, 0.071502685546875, 0.1943359375, 0.317169189453125, 0.44000244140625, 0.562835693359375, 0.6856689453125, 0.808502197265625, 0.93133544921875, 1.054168701171875, 1.177001953125, 1.299835205078125, 1.42266845703125, 1.545501708984375, 1.6683349609375, 1.791168212890625, 1.91400146484375, 2.036834716796875, 2.15966796875, 2.282501220703125, 2.40533447265625, 2.528167724609375, 2.6510009765625, 2.773834228515625, 2.89666748046875, 3.019500732421875, 3.142333984375, 3.265167236328125, 3.38800048828125, 3.510833740234375, 3.6336669921875, 3.756500244140625, 3.87933349609375, 4.002166748046875, 4.125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 7.0, 14.0, 16.0, 25.0, 30.0, 45.0, 54.0, 69.0, 95.0, 119.0, 171.0, 243.0, 375.0, 483.0, 708.0, 922.0, 1410.0, 2065.0, 3289.0, 5594.0, 9751.0, 18899.0, 43665.0, 145498.0, 657206.0, 89517.0, 32076.0, 14826.0, 7961.0, 4612.0, 2792.0, 1829.0, 1177.0, 825.0, 576.0, 446.0, 306.0, 251.0, 180.0, 125.0, 81.0, 58.0, 43.0, 32.0, 26.0, 23.0, 6.0, 12.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-14.125, -13.701171875, -13.27734375, -12.853515625, -12.4296875, -12.005859375, -11.58203125, -11.158203125, -10.734375, -10.310546875, -9.88671875, -9.462890625, -9.0390625, -8.615234375, -8.19140625, -7.767578125, -7.34375, -6.919921875, -6.49609375, -6.072265625, -5.6484375, -5.224609375, -4.80078125, -4.376953125, -3.953125, -3.529296875, -3.10546875, -2.681640625, -2.2578125, -1.833984375, -1.41015625, -0.986328125, -0.5625, -0.138671875, 0.28515625, 0.708984375, 1.1328125, 1.556640625, 1.98046875, 2.404296875, 2.828125, 3.251953125, 3.67578125, 4.099609375, 4.5234375, 4.947265625, 5.37109375, 5.794921875, 6.21875, 6.642578125, 7.06640625, 7.490234375, 7.9140625, 8.337890625, 8.76171875, 9.185546875, 9.609375, 10.033203125, 10.45703125, 10.880859375, 11.3046875, 11.728515625, 12.15234375, 12.576171875, 13.0]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 5.0, 13.0, 29.0, 32.0, 52.0, 118.0, 421.0, 157.0, 56.0, 32.0, 23.0, 13.0, 18.0, 12.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00099945068359375, -0.0009656250476837158, -0.0009317994117736816, -0.0008979737758636475, -0.0008641481399536133, -0.0008303225040435791, -0.0007964968681335449, -0.0007626712322235107, -0.0007288455963134766, -0.0006950199604034424, -0.0006611943244934082, -0.000627368688583374, -0.0005935430526733398, -0.0005597174167633057, -0.0005258917808532715, -0.0004920661449432373, -0.0004582405090332031, -0.00042441487312316895, -0.00039058923721313477, -0.0003567636013031006, -0.0003229379653930664, -0.0002891123294830322, -0.00025528669357299805, -0.00022146105766296387, -0.0001876354217529297, -0.0001538097858428955, -0.00011998414993286133, -8.615851402282715e-05, -5.233287811279297e-05, -1.850724220275879e-05, 1.531839370727539e-05, 4.914402961730957e-05, 8.296966552734375e-05, 0.00011679530143737793, 0.0001506209373474121, 0.0001844465732574463, 0.00021827220916748047, 0.00025209784507751465, 0.00028592348098754883, 0.000319749116897583, 0.0003535747528076172, 0.00038740038871765137, 0.00042122602462768555, 0.0004550516605377197, 0.0004888772964477539, 0.0005227029323577881, 0.0005565285682678223, 0.0005903542041778564, 0.0006241798400878906, 0.0006580054759979248, 0.000691831111907959, 0.0007256567478179932, 0.0007594823837280273, 0.0007933080196380615, 0.0008271336555480957, 0.0008609592914581299, 0.0008947849273681641, 0.0009286105632781982, 0.0009624361991882324, 0.0009962618350982666, 0.0010300874710083008, 0.001063913106918335, 0.0010977387428283691, 0.0011315643787384033, 0.0011653900146484375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 4.0, 9.0, 2.0, 8.0, 13.0, 14.0, 33.0, 37.0, 62.0, 70.0, 84.0, 107.0, 155.0, 184.0, 261.0, 411.0, 566.0, 794.0, 1141.0, 1800.0, 2957.0, 4671.0, 8274.0, 16254.0, 36824.0, 109128.0, 673297.0, 114937.0, 37811.0, 16569.0, 8510.0, 4791.0, 2872.0, 1826.0, 1177.0, 825.0, 545.0, 385.0, 302.0, 209.0, 165.0, 130.0, 85.0, 51.0, 52.0, 35.0, 35.0, 26.0, 15.0, 13.0, 16.0, 12.0, 2.0, 5.0, 1.0, 4.0], "bins": [-14.1875, -13.7764892578125, -13.365478515625, -12.9544677734375, -12.54345703125, -12.1324462890625, -11.721435546875, -11.3104248046875, -10.8994140625, -10.4884033203125, -10.077392578125, -9.6663818359375, -9.25537109375, -8.8443603515625, -8.433349609375, -8.0223388671875, -7.611328125, -7.2003173828125, -6.789306640625, -6.3782958984375, -5.96728515625, -5.5562744140625, -5.145263671875, -4.7342529296875, -4.3232421875, -3.9122314453125, -3.501220703125, -3.0902099609375, -2.67919921875, -2.2681884765625, -1.857177734375, -1.4461669921875, -1.03515625, -0.6241455078125, -0.213134765625, 0.1978759765625, 0.60888671875, 1.0198974609375, 1.430908203125, 1.8419189453125, 2.2529296875, 2.6639404296875, 3.074951171875, 3.4859619140625, 3.89697265625, 4.3079833984375, 4.718994140625, 5.1300048828125, 5.541015625, 5.9520263671875, 6.363037109375, 6.7740478515625, 7.18505859375, 7.5960693359375, 8.007080078125, 8.4180908203125, 8.8291015625, 9.2401123046875, 9.651123046875, 10.0621337890625, 10.47314453125, 10.8841552734375, 11.295166015625, 11.7061767578125, 12.1171875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 10.0, 12.0, 17.0, 13.0, 11.0, 14.0, 36.0, 36.0, 49.0, 64.0, 71.0, 316.0, 64.0, 61.0, 46.0, 50.0, 28.0, 13.0, 19.0, 7.0, 14.0, 9.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.23046875, -3.1168212890625, -3.003173828125, -2.8895263671875, -2.77587890625, -2.6622314453125, -2.548583984375, -2.4349365234375, -2.3212890625, -2.2076416015625, -2.093994140625, -1.9803466796875, -1.86669921875, -1.7530517578125, -1.639404296875, -1.5257568359375, -1.412109375, -1.2984619140625, -1.184814453125, -1.0711669921875, -0.95751953125, -0.8438720703125, -0.730224609375, -0.6165771484375, -0.5029296875, -0.3892822265625, -0.275634765625, -0.1619873046875, -0.04833984375, 0.0653076171875, 0.178955078125, 0.2926025390625, 0.40625, 0.5198974609375, 0.633544921875, 0.7471923828125, 0.86083984375, 0.9744873046875, 1.088134765625, 1.2017822265625, 1.3154296875, 1.4290771484375, 1.542724609375, 1.6563720703125, 1.77001953125, 1.8836669921875, 1.997314453125, 2.1109619140625, 2.224609375, 2.3382568359375, 2.451904296875, 2.5655517578125, 2.67919921875, 2.7928466796875, 2.906494140625, 3.0201416015625, 3.1337890625, 3.2474365234375, 3.361083984375, 3.4747314453125, 3.58837890625, 3.7020263671875, 3.815673828125, 3.9293212890625, 4.04296875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 7.0, 4.0, 11.0, 20.0, 15.0, 25.0, 32.0, 41.0, 74.0, 108.0, 139.0, 149.0, 99.0, 76.0, 44.0, 42.0, 26.0, 18.0, 15.0, 5.0, 11.0, 7.0, 6.0, 5.0, 5.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.125228881835938, -10.752588272094727, -10.3799467086792, -10.007306098937988, -9.634665489196777, -9.26202392578125, -8.889383316040039, -8.516742706298828, -8.144102096557617, -7.771461009979248, -7.398820400238037, -7.026179313659668, -6.653538703918457, -6.280897617340088, -5.908256530761719, -5.535615921020508, -5.1629743576049805, -4.790333271026611, -4.4176926612854, -4.045051574707031, -3.672410726547241, -3.299769878387451, -2.927128791809082, -2.554487943649292, -2.181847095489502, -1.809206247329712, -1.4365652799606323, -1.0639243125915527, -0.6912834644317627, -0.31864261627197266, 0.053998470306396484, 0.4266393184661865, 0.7992792129516602, 1.1719200611114502, 1.5445610284805298, 1.9172019958496094, 2.2898428440093994, 2.6624836921691895, 3.0351247787475586, 3.4077656269073486, 3.7804064750671387, 4.153047561645508, 4.525688171386719, 4.898329257965088, 5.270970344543457, 5.643610954284668, 6.016252040863037, 6.388893127441406, 6.761533737182617, 7.134174823760986, 7.506815433502197, 7.879456520080566, 8.252097129821777, 8.624738693237305, 8.997379302978516, 9.370019912719727, 9.742660522460938, 10.115301132202148, 10.487942695617676, 10.860583305358887, 11.233223915100098, 11.605865478515625, 11.978506088256836, 12.351146697998047, 12.723788261413574]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 8.0, 9.0, 4.0, 14.0, 12.0, 16.0, 20.0, 15.0, 23.0, 15.0, 26.0, 36.0, 26.0, 28.0, 38.0, 35.0, 47.0, 27.0, 36.0, 36.0, 24.0, 31.0, 26.0, 42.0, 33.0, 36.0, 39.0, 41.0, 33.0, 19.0, 25.0, 27.0, 20.0, 23.0, 12.0, 20.0, 13.0, 8.0, 8.0, 11.0, 6.0, 5.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.106066703796387, -5.912587642669678, -5.7191081047058105, -5.525629043579102, -5.332149982452393, -5.138670921325684, -4.945191383361816, -4.751712322235107, -4.558233261108398, -4.3647541999816895, -4.171274662017822, -3.9777956008911133, -3.7843165397644043, -3.590837240219116, -3.397357940673828, -3.203878879547119, -3.010399580001831, -2.816920280456543, -2.623441219329834, -2.429961919784546, -2.236482858657837, -2.043003559112549, -1.8495243787765503, -1.6560451984405518, -1.4625660181045532, -1.2690868377685547, -1.0756076574325562, -0.8821284174919128, -0.6886492371559143, -0.49517005681991577, -0.30169081687927246, -0.10821163654327393, 0.08526754379272461, 0.27874672412872314, 0.47222593426704407, 0.665705144405365, 0.8591843247413635, 1.0526635646820068, 1.2461427450180054, 1.439621925354004, 1.6331011056900024, 1.826580286026001, 2.020059585571289, 2.213538646697998, 2.407017946243286, 2.600497007369995, 2.793976306915283, 2.987455368041992, 3.1809346675872803, 3.3744139671325684, 3.5678930282592773, 3.7613723278045654, 3.9548513889312744, 4.1483306884765625, 4.3418097496032715, 4.5352888107299805, 4.728768348693848, 4.922247409820557, 5.115726947784424, 5.309206008911133, 5.502685070037842, 5.696164131164551, 5.889643669128418, 6.083122730255127, 6.276601791381836]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 4.0, 6.0, 9.0, 7.0, 10.0, 24.0, 27.0, 45.0, 63.0, 94.0, 115.0, 181.0, 237.0, 369.0, 471.0, 716.0, 961.0, 1320.0, 1981.0, 2728.0, 4029.0, 5957.0, 8870.0, 13686.0, 21582.0, 35207.0, 60137.0, 112125.0, 253482.0, 897753.0, 1786750.0, 564229.0, 192937.0, 91799.0, 50501.0, 29967.0, 18571.0, 11781.0, 8040.0, 5369.0, 3751.0, 2480.0, 1814.0, 1199.0, 906.0, 591.0, 440.0, 295.0, 217.0, 144.0, 101.0, 84.0, 37.0, 25.0, 25.0, 20.0, 9.0, 6.0, 4.0, 8.0], "bins": [-9.609375, -9.3294677734375, -9.049560546875, -8.7696533203125, -8.48974609375, -8.2098388671875, -7.929931640625, -7.6500244140625, -7.3701171875, -7.0902099609375, -6.810302734375, -6.5303955078125, -6.25048828125, -5.9705810546875, -5.690673828125, -5.4107666015625, -5.130859375, -4.8509521484375, -4.571044921875, -4.2911376953125, -4.01123046875, -3.7313232421875, -3.451416015625, -3.1715087890625, -2.8916015625, -2.6116943359375, -2.331787109375, -2.0518798828125, -1.77197265625, -1.4920654296875, -1.212158203125, -0.9322509765625, -0.65234375, -0.3724365234375, -0.092529296875, 0.1873779296875, 0.46728515625, 0.7471923828125, 1.027099609375, 1.3070068359375, 1.5869140625, 1.8668212890625, 2.146728515625, 2.4266357421875, 2.70654296875, 2.9864501953125, 3.266357421875, 3.5462646484375, 3.826171875, 4.1060791015625, 4.385986328125, 4.6658935546875, 4.94580078125, 5.2257080078125, 5.505615234375, 5.7855224609375, 6.0654296875, 6.3453369140625, 6.625244140625, 6.9051513671875, 7.18505859375, 7.4649658203125, 7.744873046875, 8.0247802734375, 8.3046875]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 0.0, 6.0, 4.0, 10.0, 5.0, 4.0, 9.0, 7.0, 13.0, 15.0, 14.0, 27.0, 22.0, 18.0, 25.0, 23.0, 35.0, 39.0, 33.0, 45.0, 35.0, 32.0, 38.0, 39.0, 26.0, 25.0, 42.0, 36.0, 45.0, 46.0, 39.0, 31.0, 30.0, 21.0, 20.0, 19.0, 12.0, 20.0, 21.0, 14.0, 7.0, 20.0, 8.0, 2.0, 5.0, 1.0, 5.0, 3.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-4.1875, -4.06378173828125, -3.9400634765625, -3.81634521484375, -3.692626953125, -3.56890869140625, -3.4451904296875, -3.32147216796875, -3.19775390625, -3.07403564453125, -2.9503173828125, -2.82659912109375, -2.702880859375, -2.57916259765625, -2.4554443359375, -2.33172607421875, -2.2080078125, -2.08428955078125, -1.9605712890625, -1.83685302734375, -1.713134765625, -1.58941650390625, -1.4656982421875, -1.34197998046875, -1.21826171875, -1.09454345703125, -0.9708251953125, -0.84710693359375, -0.723388671875, -0.59967041015625, -0.4759521484375, -0.35223388671875, -0.228515625, -0.10479736328125, 0.0189208984375, 0.14263916015625, 0.266357421875, 0.39007568359375, 0.5137939453125, 0.63751220703125, 0.76123046875, 0.88494873046875, 1.0086669921875, 1.13238525390625, 1.256103515625, 1.37982177734375, 1.5035400390625, 1.62725830078125, 1.7509765625, 1.87469482421875, 1.9984130859375, 2.12213134765625, 2.245849609375, 2.36956787109375, 2.4932861328125, 2.61700439453125, 2.74072265625, 2.86444091796875, 2.9881591796875, 3.11187744140625, 3.235595703125, 3.35931396484375, 3.4830322265625, 3.60675048828125, 3.73046875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 16.0, 7.0, 18.0, 26.0, 49.0, 61.0, 70.0, 118.0, 192.0, 302.0, 454.0, 707.0, 1160.0, 1916.0, 3062.0, 5247.0, 9587.0, 17654.0, 34301.0, 71583.0, 166064.0, 465720.0, 1830124.0, 1058544.0, 299100.0, 116907.0, 52853.0, 26010.0, 13696.0, 7650.0, 4314.0, 2569.0, 1516.0, 921.0, 615.0, 370.0, 255.0, 169.0, 108.0, 82.0, 53.0, 34.0, 26.0, 9.0, 18.0, 7.0, 4.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.4375, -9.131103515625, -8.82470703125, -8.518310546875, -8.2119140625, -7.905517578125, -7.59912109375, -7.292724609375, -6.986328125, -6.679931640625, -6.37353515625, -6.067138671875, -5.7607421875, -5.454345703125, -5.14794921875, -4.841552734375, -4.53515625, -4.228759765625, -3.92236328125, -3.615966796875, -3.3095703125, -3.003173828125, -2.69677734375, -2.390380859375, -2.083984375, -1.777587890625, -1.47119140625, -1.164794921875, -0.8583984375, -0.552001953125, -0.24560546875, 0.060791015625, 0.3671875, 0.673583984375, 0.97998046875, 1.286376953125, 1.5927734375, 1.899169921875, 2.20556640625, 2.511962890625, 2.818359375, 3.124755859375, 3.43115234375, 3.737548828125, 4.0439453125, 4.350341796875, 4.65673828125, 4.963134765625, 5.26953125, 5.575927734375, 5.88232421875, 6.188720703125, 6.4951171875, 6.801513671875, 7.10791015625, 7.414306640625, 7.720703125, 8.027099609375, 8.33349609375, 8.639892578125, 8.9462890625, 9.252685546875, 9.55908203125, 9.865478515625, 10.171875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 5.0, 17.0, 13.0, 10.0, 24.0, 30.0, 39.0, 52.0, 75.0, 83.0, 98.0, 125.0, 189.0, 194.0, 241.0, 266.0, 343.0, 402.0, 338.0, 295.0, 258.0, 207.0, 147.0, 132.0, 95.0, 86.0, 64.0, 59.0, 37.0, 35.0, 28.0, 20.0, 9.0, 12.0, 11.0, 7.0, 4.0, 3.0, 3.0, 0.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.558074951171875, -2.47747802734375, -2.396881103515625, -2.3162841796875, -2.235687255859375, -2.15509033203125, -2.074493408203125, -1.993896484375, -1.913299560546875, -1.83270263671875, -1.752105712890625, -1.6715087890625, -1.590911865234375, -1.51031494140625, -1.429718017578125, -1.34912109375, -1.268524169921875, -1.18792724609375, -1.107330322265625, -1.0267333984375, -0.946136474609375, -0.86553955078125, -0.784942626953125, -0.704345703125, -0.623748779296875, -0.54315185546875, -0.462554931640625, -0.3819580078125, -0.301361083984375, -0.22076416015625, -0.140167236328125, -0.0595703125, 0.021026611328125, 0.10162353515625, 0.182220458984375, 0.2628173828125, 0.343414306640625, 0.42401123046875, 0.504608154296875, 0.585205078125, 0.665802001953125, 0.74639892578125, 0.826995849609375, 0.9075927734375, 0.988189697265625, 1.06878662109375, 1.149383544921875, 1.22998046875, 1.310577392578125, 1.39117431640625, 1.471771240234375, 1.5523681640625, 1.632965087890625, 1.71356201171875, 1.794158935546875, 1.874755859375, 1.955352783203125, 2.03594970703125, 2.116546630859375, 2.1971435546875, 2.277740478515625, 2.35833740234375, 2.438934326171875, 2.51953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 8.0, 6.0, 6.0, 10.0, 14.0, 22.0, 26.0, 34.0, 65.0, 68.0, 122.0, 143.0, 120.0, 110.0, 61.0, 42.0, 38.0, 26.0, 23.0, 17.0, 9.0, 4.0, 6.0, 7.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.236019134521484, -8.955768585205078, -8.675518989562988, -8.395269393920898, -8.115018844604492, -7.834768772125244, -7.554518699645996, -7.274268627166748, -6.9940185546875, -6.713768482208252, -6.433518409729004, -6.153268337249756, -5.873018264770508, -5.59276819229126, -5.312518119812012, -5.032268047332764, -4.752017974853516, -4.471767902374268, -4.1915178298950195, -3.9112677574157715, -3.6310176849365234, -3.3507676124572754, -3.0705175399780273, -2.7902674674987793, -2.5100173950195312, -2.229767322540283, -1.9495172500610352, -1.669267177581787, -1.389017105102539, -1.108767032623291, -0.828516960144043, -0.5482668876647949, -0.2680177688598633, 0.012232303619384766, 0.2924823760986328, 0.5727324485778809, 0.8529825210571289, 1.133232593536377, 1.413482666015625, 1.693732738494873, 1.973982810974121, 2.254232883453369, 2.534482955932617, 2.8147330284118652, 3.0949831008911133, 3.3752331733703613, 3.6554832458496094, 3.9357333183288574, 4.2159833908081055, 4.4962334632873535, 4.776483535766602, 5.05673360824585, 5.336983680725098, 5.617233753204346, 5.897483825683594, 6.177733898162842, 6.45798397064209, 6.738234043121338, 7.018484115600586, 7.298734188079834, 7.578984260559082, 7.85923433303833, 8.139484405517578, 8.419734954833984, 8.699984550476074]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 6.0, 11.0, 18.0, 5.0, 17.0, 13.0, 26.0, 23.0, 21.0, 19.0, 37.0, 39.0, 34.0, 22.0, 42.0, 28.0, 44.0, 39.0, 34.0, 39.0, 29.0, 36.0, 30.0, 39.0, 34.0, 37.0, 45.0, 24.0, 23.0, 29.0, 22.0, 19.0, 11.0, 17.0, 13.0, 10.0, 8.0, 15.0, 6.0, 5.0, 5.0, 3.0, 8.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.933816432952881, -4.792288303375244, -4.650760173797607, -4.509232044219971, -4.367703437805176, -4.226175308227539, -4.084647178649902, -3.9431190490722656, -3.801590919494629, -3.660062789916992, -3.5185346603393555, -3.3770062923431396, -3.235478162765503, -3.093950033187866, -2.9524216651916504, -2.8108935356140137, -2.669365406036377, -2.5278372764587402, -2.3863091468811035, -2.2447807788848877, -2.103252649307251, -1.9617245197296143, -1.820196270942688, -1.6786680221557617, -1.537139892578125, -1.3956117630004883, -1.254083514213562, -1.1125552654266357, -0.971027135848999, -0.8294989466667175, -0.687970757484436, -0.5464425683021545, -0.40491485595703125, -0.26338666677474976, -0.12185847759246826, 0.019669711589813232, 0.16119790077209473, 0.3027260899543762, 0.4442542791366577, 0.5857824683189392, 0.7273106575012207, 0.8688388466835022, 1.0103670358657837, 1.15189528465271, 1.2934234142303467, 1.4349515438079834, 1.5764797925949097, 1.718008041381836, 1.8595361709594727, 2.0010643005371094, 2.142592430114746, 2.284120798110962, 2.4256489276885986, 2.5671770572662354, 2.708705425262451, 2.850233554840088, 2.9917616844177246, 3.1332898139953613, 3.274817943572998, 3.416346311569214, 3.5578744411468506, 3.6994025707244873, 3.840930938720703, 3.98245906829834, 4.123987197875977]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 10.0, 12.0, 18.0, 30.0, 42.0, 39.0, 74.0, 105.0, 150.0, 203.0, 340.0, 498.0, 667.0, 1061.0, 1536.0, 2524.0, 3642.0, 5983.0, 9693.0, 16739.0, 30442.0, 59156.0, 130432.0, 334080.0, 244610.0, 98790.0, 46591.0, 24652.0, 13773.0, 8067.0, 5082.0, 3164.0, 2044.0, 1395.0, 921.0, 628.0, 416.0, 271.0, 195.0, 138.0, 110.0, 65.0, 52.0, 37.0, 20.0, 14.0, 13.0, 13.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.00390625, -1.940948486328125, -1.87799072265625, -1.815032958984375, -1.7520751953125, -1.689117431640625, -1.62615966796875, -1.563201904296875, -1.500244140625, -1.437286376953125, -1.37432861328125, -1.311370849609375, -1.2484130859375, -1.185455322265625, -1.12249755859375, -1.059539794921875, -0.99658203125, -0.933624267578125, -0.87066650390625, -0.807708740234375, -0.7447509765625, -0.681793212890625, -0.61883544921875, -0.555877685546875, -0.492919921875, -0.429962158203125, -0.36700439453125, -0.304046630859375, -0.2410888671875, -0.178131103515625, -0.11517333984375, -0.052215576171875, 0.0107421875, 0.073699951171875, 0.13665771484375, 0.199615478515625, 0.2625732421875, 0.325531005859375, 0.38848876953125, 0.451446533203125, 0.514404296875, 0.577362060546875, 0.64031982421875, 0.703277587890625, 0.7662353515625, 0.829193115234375, 0.89215087890625, 0.955108642578125, 1.01806640625, 1.081024169921875, 1.14398193359375, 1.206939697265625, 1.2698974609375, 1.332855224609375, 1.39581298828125, 1.458770751953125, 1.521728515625, 1.584686279296875, 1.64764404296875, 1.710601806640625, 1.7735595703125, 1.836517333984375, 1.89947509765625, 1.962432861328125, 2.025390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 0.0, 2.0, 4.0, 7.0, 7.0, 12.0, 13.0, 16.0, 22.0, 18.0, 16.0, 21.0, 17.0, 24.0, 38.0, 32.0, 32.0, 22.0, 42.0, 26.0, 41.0, 36.0, 36.0, 33.0, 39.0, 34.0, 37.0, 33.0, 34.0, 33.0, 31.0, 36.0, 31.0, 14.0, 27.0, 20.0, 20.0, 15.0, 11.0, 15.0, 14.0, 5.0, 10.0, 4.0, 5.0, 3.0, 5.0, 2.0, 5.0, 0.0, 3.0, 0.0, 3.0], "bins": [-4.87890625, -4.73681640625, -4.5947265625, -4.45263671875, -4.310546875, -4.16845703125, -4.0263671875, -3.88427734375, -3.7421875, -3.60009765625, -3.4580078125, -3.31591796875, -3.173828125, -3.03173828125, -2.8896484375, -2.74755859375, -2.60546875, -2.46337890625, -2.3212890625, -2.17919921875, -2.037109375, -1.89501953125, -1.7529296875, -1.61083984375, -1.46875, -1.32666015625, -1.1845703125, -1.04248046875, -0.900390625, -0.75830078125, -0.6162109375, -0.47412109375, -0.33203125, -0.18994140625, -0.0478515625, 0.09423828125, 0.236328125, 0.37841796875, 0.5205078125, 0.66259765625, 0.8046875, 0.94677734375, 1.0888671875, 1.23095703125, 1.373046875, 1.51513671875, 1.6572265625, 1.79931640625, 1.94140625, 2.08349609375, 2.2255859375, 2.36767578125, 2.509765625, 2.65185546875, 2.7939453125, 2.93603515625, 3.078125, 3.22021484375, 3.3623046875, 3.50439453125, 3.646484375, 3.78857421875, 3.9306640625, 4.07275390625, 4.21484375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 6.0, 7.0, 8.0, 7.0, 11.0, 13.0, 27.0, 40.0, 44.0, 50.0, 97.0, 149.0, 198.0, 307.0, 456.0, 723.0, 1133.0, 1810.0, 3281.0, 5879.0, 12576.0, 28659.0, 78184.0, 330945.0, 430200.0, 92153.0, 32300.0, 13745.0, 6626.0, 3544.0, 1957.0, 1197.0, 751.0, 458.0, 313.0, 251.0, 118.0, 85.0, 79.0, 57.0, 34.0, 14.0, 23.0, 15.0, 13.0, 6.0, 2.0, 4.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.13671875, -3.02880859375, -2.9208984375, -2.81298828125, -2.705078125, -2.59716796875, -2.4892578125, -2.38134765625, -2.2734375, -2.16552734375, -2.0576171875, -1.94970703125, -1.841796875, -1.73388671875, -1.6259765625, -1.51806640625, -1.41015625, -1.30224609375, -1.1943359375, -1.08642578125, -0.978515625, -0.87060546875, -0.7626953125, -0.65478515625, -0.546875, -0.43896484375, -0.3310546875, -0.22314453125, -0.115234375, -0.00732421875, 0.1005859375, 0.20849609375, 0.31640625, 0.42431640625, 0.5322265625, 0.64013671875, 0.748046875, 0.85595703125, 0.9638671875, 1.07177734375, 1.1796875, 1.28759765625, 1.3955078125, 1.50341796875, 1.611328125, 1.71923828125, 1.8271484375, 1.93505859375, 2.04296875, 2.15087890625, 2.2587890625, 2.36669921875, 2.474609375, 2.58251953125, 2.6904296875, 2.79833984375, 2.90625, 3.01416015625, 3.1220703125, 3.22998046875, 3.337890625, 3.44580078125, 3.5537109375, 3.66162109375, 3.76953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 11.0, 12.0, 11.0, 12.0, 7.0, 21.0, 23.0, 22.0, 19.0, 25.0, 23.0, 39.0, 33.0, 36.0, 36.0, 44.0, 45.0, 46.0, 43.0, 48.0, 46.0, 44.0, 43.0, 46.0, 39.0, 33.0, 24.0, 26.0, 26.0, 18.0, 21.0, 15.0, 12.0, 16.0, 11.0, 12.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.1412353515625, -3.030517578125, -2.9197998046875, -2.80908203125, -2.6983642578125, -2.587646484375, -2.4769287109375, -2.3662109375, -2.2554931640625, -2.144775390625, -2.0340576171875, -1.92333984375, -1.8126220703125, -1.701904296875, -1.5911865234375, -1.48046875, -1.3697509765625, -1.259033203125, -1.1483154296875, -1.03759765625, -0.9268798828125, -0.816162109375, -0.7054443359375, -0.5947265625, -0.4840087890625, -0.373291015625, -0.2625732421875, -0.15185546875, -0.0411376953125, 0.069580078125, 0.1802978515625, 0.291015625, 0.4017333984375, 0.512451171875, 0.6231689453125, 0.73388671875, 0.8446044921875, 0.955322265625, 1.0660400390625, 1.1767578125, 1.2874755859375, 1.398193359375, 1.5089111328125, 1.61962890625, 1.7303466796875, 1.841064453125, 1.9517822265625, 2.0625, 2.1732177734375, 2.283935546875, 2.3946533203125, 2.50537109375, 2.6160888671875, 2.726806640625, 2.8375244140625, 2.9482421875, 3.0589599609375, 3.169677734375, 3.2803955078125, 3.39111328125, 3.5018310546875, 3.612548828125, 3.7232666015625, 3.833984375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 8.0, 5.0, 11.0, 11.0, 16.0, 28.0, 38.0, 56.0, 72.0, 102.0, 183.0, 259.0, 375.0, 562.0, 944.0, 1613.0, 2713.0, 5260.0, 10141.0, 22257.0, 58100.0, 218437.0, 563971.0, 99174.0, 33751.0, 14442.0, 6907.0, 3708.0, 2081.0, 1201.0, 733.0, 479.0, 318.0, 175.0, 117.0, 106.0, 58.0, 42.0, 29.0, 23.0, 6.0, 12.0, 13.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.51953125, -0.501129150390625, -0.48272705078125, -0.464324951171875, -0.4459228515625, -0.427520751953125, -0.40911865234375, -0.390716552734375, -0.372314453125, -0.353912353515625, -0.33551025390625, -0.317108154296875, -0.2987060546875, -0.280303955078125, -0.26190185546875, -0.243499755859375, -0.22509765625, -0.206695556640625, -0.18829345703125, -0.169891357421875, -0.1514892578125, -0.133087158203125, -0.11468505859375, -0.096282958984375, -0.077880859375, -0.059478759765625, -0.04107666015625, -0.022674560546875, -0.0042724609375, 0.014129638671875, 0.03253173828125, 0.050933837890625, 0.0693359375, 0.087738037109375, 0.10614013671875, 0.124542236328125, 0.1429443359375, 0.161346435546875, 0.17974853515625, 0.198150634765625, 0.216552734375, 0.234954833984375, 0.25335693359375, 0.271759033203125, 0.2901611328125, 0.308563232421875, 0.32696533203125, 0.345367431640625, 0.36376953125, 0.382171630859375, 0.40057373046875, 0.418975830078125, 0.4373779296875, 0.455780029296875, 0.47418212890625, 0.492584228515625, 0.510986328125, 0.529388427734375, 0.54779052734375, 0.566192626953125, 0.5845947265625, 0.602996826171875, 0.62139892578125, 0.639801025390625, 0.658203125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 3.0, 7.0, 12.0, 9.0, 24.0, 22.0, 45.0, 61.0, 87.0, 169.0, 186.0, 134.0, 81.0, 50.0, 33.0, 23.0, 21.0, 8.0, 9.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.937980651855469e-05, -6.746780127286911e-05, -6.555579602718353e-05, -6.364379078149796e-05, -6.173178553581238e-05, -5.98197802901268e-05, -5.790777504444122e-05, -5.5995769798755646e-05, -5.408376455307007e-05, -5.217175930738449e-05, -5.0259754061698914e-05, -4.8347748816013336e-05, -4.643574357032776e-05, -4.452373832464218e-05, -4.2611733078956604e-05, -4.0699727833271027e-05, -3.878772258758545e-05, -3.687571734189987e-05, -3.4963712096214294e-05, -3.305170685052872e-05, -3.113970160484314e-05, -2.9227696359157562e-05, -2.7315691113471985e-05, -2.5403685867786407e-05, -2.349168062210083e-05, -2.1579675376415253e-05, -1.9667670130729675e-05, -1.7755664885044098e-05, -1.584365963935852e-05, -1.3931654393672943e-05, -1.2019649147987366e-05, -1.0107643902301788e-05, -8.195638656616211e-06, -6.2836334109306335e-06, -4.371628165245056e-06, -2.4596229195594788e-06, -5.476176738739014e-07, 1.364387571811676e-06, 3.2763928174972534e-06, 5.188398063182831e-06, 7.100403308868408e-06, 9.012408554553986e-06, 1.0924413800239563e-05, 1.283641904592514e-05, 1.4748424291610718e-05, 1.6660429537296295e-05, 1.8572434782981873e-05, 2.048444002866745e-05, 2.2396445274353027e-05, 2.4308450520038605e-05, 2.6220455765724182e-05, 2.813246101140976e-05, 3.0044466257095337e-05, 3.1956471502780914e-05, 3.386847674846649e-05, 3.578048199415207e-05, 3.7692487239837646e-05, 3.9604492485523224e-05, 4.15164977312088e-05, 4.342850297689438e-05, 4.5340508222579956e-05, 4.7252513468265533e-05, 4.916451871395111e-05, 5.107652395963669e-05, 5.2988529205322266e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 17.0, 20.0, 22.0, 49.0, 62.0, 77.0, 133.0, 196.0, 277.0, 389.0, 574.0, 916.0, 1309.0, 2020.0, 3116.0, 4883.0, 8082.0, 13666.0, 25353.0, 52802.0, 149600.0, 526457.0, 145683.0, 52147.0, 25056.0, 13680.0, 7889.0, 4910.0, 3163.0, 1944.0, 1318.0, 897.0, 605.0, 383.0, 263.0, 185.0, 124.0, 80.0, 62.0, 50.0, 29.0, 19.0, 14.0, 10.0, 7.0, 0.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7451171875, -0.7206802368164062, -0.6962432861328125, -0.6718063354492188, -0.647369384765625, -0.6229324340820312, -0.5984954833984375, -0.5740585327148438, -0.54962158203125, -0.5251846313476562, -0.5007476806640625, -0.47631072998046875, -0.451873779296875, -0.42743682861328125, -0.4029998779296875, -0.37856292724609375, -0.3541259765625, -0.32968902587890625, -0.3052520751953125, -0.28081512451171875, -0.256378173828125, -0.23194122314453125, -0.2075042724609375, -0.18306732177734375, -0.15863037109375, -0.13419342041015625, -0.1097564697265625, -0.08531951904296875, -0.060882568359375, -0.03644561767578125, -0.0120086669921875, 0.01242828369140625, 0.036865234375, 0.06130218505859375, 0.0857391357421875, 0.11017608642578125, 0.134613037109375, 0.15904998779296875, 0.1834869384765625, 0.20792388916015625, 0.23236083984375, 0.25679779052734375, 0.2812347412109375, 0.30567169189453125, 0.330108642578125, 0.35454559326171875, 0.3789825439453125, 0.40341949462890625, 0.4278564453125, 0.45229339599609375, 0.4767303466796875, 0.5011672973632812, 0.525604248046875, 0.5500411987304688, 0.5744781494140625, 0.5989151000976562, 0.62335205078125, 0.6477890014648438, 0.6722259521484375, 0.6966629028320312, 0.721099853515625, 0.7455368041992188, 0.7699737548828125, 0.7944107055664062, 0.81884765625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 9.0, 4.0, 10.0, 6.0, 12.0, 7.0, 13.0, 26.0, 20.0, 23.0, 34.0, 34.0, 36.0, 56.0, 51.0, 69.0, 155.0, 74.0, 67.0, 40.0, 35.0, 27.0, 18.0, 22.0, 19.0, 20.0, 15.0, 13.0, 8.0, 17.0, 11.0, 10.0, 2.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2034912109375, -0.1972522735595703, -0.19101333618164062, -0.18477439880371094, -0.17853546142578125, -0.17229652404785156, -0.16605758666992188, -0.1598186492919922, -0.1535797119140625, -0.1473407745361328, -0.14110183715820312, -0.13486289978027344, -0.12862396240234375, -0.12238502502441406, -0.11614608764648438, -0.10990715026855469, -0.103668212890625, -0.09742927551269531, -0.09119033813476562, -0.08495140075683594, -0.07871246337890625, -0.07247352600097656, -0.06623458862304688, -0.05999565124511719, -0.0537567138671875, -0.04751777648925781, -0.041278839111328125, -0.03503990173339844, -0.02880096435546875, -0.022562026977539062, -0.016323089599609375, -0.010084152221679688, -0.00384521484375, 0.0023937225341796875, 0.008632659912109375, 0.014871597290039062, 0.02111053466796875, 0.027349472045898438, 0.033588409423828125, 0.03982734680175781, 0.0460662841796875, 0.05230522155761719, 0.058544158935546875, 0.06478309631347656, 0.07102203369140625, 0.07726097106933594, 0.08349990844726562, 0.08973884582519531, 0.095977783203125, 0.10221672058105469, 0.10845565795898438, 0.11469459533691406, 0.12093353271484375, 0.12717247009277344, 0.13341140747070312, 0.1396503448486328, 0.1458892822265625, 0.1521282196044922, 0.15836715698242188, 0.16460609436035156, 0.17084503173828125, 0.17708396911621094, 0.18332290649414062, 0.1895618438720703, 0.19580078125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 6.0, 10.0, 15.0, 21.0, 25.0, 33.0, 56.0, 77.0, 117.0, 135.0, 132.0, 106.0, 57.0, 51.0, 28.0, 33.0, 22.0, 15.0, 13.0, 8.0, 1.0, 12.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.710054397583008, -8.437118530273438, -8.16418170928955, -7.891245365142822, -7.618309020996094, -7.345373153686523, -7.072436809539795, -6.799500465393066, -6.526564121246338, -6.253627777099609, -5.980691432952881, -5.707755088806152, -5.434819221496582, -5.161882400512695, -4.888946533203125, -4.6160101890563965, -4.343073844909668, -4.0701375007629395, -3.797201156616211, -3.5242650508880615, -3.251328706741333, -2.9783923625946045, -2.705456256866455, -2.4325199127197266, -2.159583568572998, -1.8866472244262695, -1.6137109994888306, -1.3407747745513916, -1.067838430404663, -0.7949020862579346, -0.5219658613204956, -0.24902963638305664, 0.02390575408935547, 0.2968420386314392, 0.569778323173523, 0.8427146077156067, 1.1156508922576904, 1.388587236404419, 1.661523461341858, 1.9344596862792969, 2.2073960304260254, 2.480332374572754, 2.7532687187194824, 3.026204824447632, 3.2991411685943604, 3.572077512741089, 3.8450136184692383, 4.117949962615967, 4.390886306762695, 4.663822650909424, 4.936758995056152, 5.209695339202881, 5.482631683349609, 5.75556755065918, 6.028503894805908, 6.301440238952637, 6.574376583099365, 6.847312927246094, 7.120249271392822, 7.393185615539551, 7.666121482849121, 7.939058303833008, 8.211994171142578, 8.484930038452148, 8.757866859436035]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 7.0, 3.0, 12.0, 14.0, 10.0, 15.0, 12.0, 30.0, 21.0, 23.0, 23.0, 30.0, 37.0, 37.0, 24.0, 38.0, 29.0, 49.0, 38.0, 39.0, 31.0, 32.0, 32.0, 37.0, 37.0, 40.0, 31.0, 41.0, 27.0, 29.0, 24.0, 25.0, 17.0, 11.0, 15.0, 10.0, 13.0, 8.0, 13.0, 8.0, 6.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.03795051574707, -4.89420223236084, -4.750453948974609, -4.606705188751221, -4.46295690536499, -4.31920862197876, -4.175459861755371, -4.031711578369141, -3.88796329498291, -3.7442150115966797, -3.60046648979187, -3.4567179679870605, -3.31296968460083, -3.1692214012145996, -3.02547287940979, -2.8817243576049805, -2.73797607421875, -2.5942277908325195, -2.45047926902771, -2.3067307472229004, -2.16298246383667, -2.0192341804504395, -1.8754856586456299, -1.7317372560501099, -1.5879888534545898, -1.4442404508590698, -1.3004920482635498, -1.1567436456680298, -1.0129952430725098, -0.8692468404769897, -0.7254984378814697, -0.5817500352859497, -0.4380021095275879, -0.29425370693206787, -0.15050530433654785, -0.006756901741027832, 0.1369915008544922, 0.2807399034500122, 0.4244883060455322, 0.5682367086410522, 0.7119851112365723, 0.8557335138320923, 0.9994819164276123, 1.1432303190231323, 1.2869787216186523, 1.4307271242141724, 1.5744755268096924, 1.7182239294052124, 1.8619723320007324, 2.005720615386963, 2.1494691371917725, 2.293217658996582, 2.4369659423828125, 2.580714225769043, 2.7244627475738525, 2.868211269378662, 3.0119595527648926, 3.155707836151123, 3.2994563579559326, 3.443204879760742, 3.5869531631469727, 3.730701446533203, 3.8744499683380127, 4.018198490142822, 4.161946773529053]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 0.0, 7.0, 11.0, 24.0, 30.0, 41.0, 50.0, 83.0, 121.0, 149.0, 226.0, 358.0, 463.0, 733.0, 970.0, 1463.0, 2194.0, 3339.0, 5023.0, 7965.0, 12532.0, 20081.0, 34081.0, 58654.0, 103513.0, 192936.0, 252640.0, 148751.0, 81932.0, 46314.0, 27362.0, 16611.0, 10438.0, 6400.0, 4240.0, 2827.0, 1894.0, 1235.0, 876.0, 599.0, 451.0, 293.0, 199.0, 146.0, 98.0, 66.0, 44.0, 35.0, 28.0, 12.0, 11.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-7.953125, -7.70684814453125, -7.4605712890625, -7.21429443359375, -6.968017578125, -6.72174072265625, -6.4754638671875, -6.22918701171875, -5.98291015625, -5.73663330078125, -5.4903564453125, -5.24407958984375, -4.997802734375, -4.75152587890625, -4.5052490234375, -4.25897216796875, -4.0126953125, -3.76641845703125, -3.5201416015625, -3.27386474609375, -3.027587890625, -2.78131103515625, -2.5350341796875, -2.28875732421875, -2.04248046875, -1.79620361328125, -1.5499267578125, -1.30364990234375, -1.057373046875, -0.81109619140625, -0.5648193359375, -0.31854248046875, -0.072265625, 0.17401123046875, 0.4202880859375, 0.66656494140625, 0.912841796875, 1.15911865234375, 1.4053955078125, 1.65167236328125, 1.89794921875, 2.14422607421875, 2.3905029296875, 2.63677978515625, 2.883056640625, 3.12933349609375, 3.3756103515625, 3.62188720703125, 3.8681640625, 4.11444091796875, 4.3607177734375, 4.60699462890625, 4.853271484375, 5.09954833984375, 5.3458251953125, 5.59210205078125, 5.83837890625, 6.08465576171875, 6.3309326171875, 6.57720947265625, 6.823486328125, 7.06976318359375, 7.3160400390625, 7.56231689453125, 7.80859375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 12.0, 11.0, 17.0, 9.0, 15.0, 11.0, 20.0, 26.0, 25.0, 30.0, 38.0, 34.0, 26.0, 33.0, 33.0, 35.0, 39.0, 46.0, 48.0, 51.0, 32.0, 34.0, 37.0, 38.0, 34.0, 33.0, 38.0, 25.0, 22.0, 22.0, 22.0, 16.0, 15.0, 15.0, 14.0, 7.0, 9.0, 6.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0], "bins": [-4.87890625, -4.745025634765625, -4.61114501953125, -4.477264404296875, -4.3433837890625, -4.209503173828125, -4.07562255859375, -3.941741943359375, -3.807861328125, -3.673980712890625, -3.54010009765625, -3.406219482421875, -3.2723388671875, -3.138458251953125, -3.00457763671875, -2.870697021484375, -2.73681640625, -2.602935791015625, -2.46905517578125, -2.335174560546875, -2.2012939453125, -2.067413330078125, -1.93353271484375, -1.799652099609375, -1.665771484375, -1.531890869140625, -1.39801025390625, -1.264129638671875, -1.1302490234375, -0.996368408203125, -0.86248779296875, -0.728607177734375, -0.5947265625, -0.460845947265625, -0.32696533203125, -0.193084716796875, -0.0592041015625, 0.074676513671875, 0.20855712890625, 0.342437744140625, 0.476318359375, 0.610198974609375, 0.74407958984375, 0.877960205078125, 1.0118408203125, 1.145721435546875, 1.27960205078125, 1.413482666015625, 1.54736328125, 1.681243896484375, 1.81512451171875, 1.949005126953125, 2.0828857421875, 2.216766357421875, 2.35064697265625, 2.484527587890625, 2.618408203125, 2.752288818359375, 2.88616943359375, 3.020050048828125, 3.1539306640625, 3.287811279296875, 3.42169189453125, 3.555572509765625, 3.689453125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 11.0, 14.0, 6.0, 21.0, 39.0, 49.0, 67.0, 91.0, 151.0, 229.0, 335.0, 511.0, 840.0, 1406.0, 2424.0, 4209.0, 7445.0, 13977.0, 26116.0, 51172.0, 104954.0, 226910.0, 305786.0, 151075.0, 72089.0, 35821.0, 18967.0, 10127.0, 5699.0, 3107.0, 1858.0, 1120.0, 642.0, 463.0, 266.0, 184.0, 114.0, 77.0, 57.0, 35.0, 33.0, 14.0, 9.0, 4.0, 7.0, 6.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.3203125, -9.03125, -8.7421875, -8.453125, -8.1640625, -7.875, -7.5859375, -7.296875, -7.0078125, -6.71875, -6.4296875, -6.140625, -5.8515625, -5.5625, -5.2734375, -4.984375, -4.6953125, -4.40625, -4.1171875, -3.828125, -3.5390625, -3.25, -2.9609375, -2.671875, -2.3828125, -2.09375, -1.8046875, -1.515625, -1.2265625, -0.9375, -0.6484375, -0.359375, -0.0703125, 0.21875, 0.5078125, 0.796875, 1.0859375, 1.375, 1.6640625, 1.953125, 2.2421875, 2.53125, 2.8203125, 3.109375, 3.3984375, 3.6875, 3.9765625, 4.265625, 4.5546875, 4.84375, 5.1328125, 5.421875, 5.7109375, 6.0, 6.2890625, 6.578125, 6.8671875, 7.15625, 7.4453125, 7.734375, 8.0234375, 8.3125, 8.6015625, 8.890625, 9.1796875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 11.0, 7.0, 11.0, 12.0, 13.0, 20.0, 15.0, 22.0, 12.0, 21.0, 31.0, 27.0, 34.0, 28.0, 35.0, 36.0, 42.0, 35.0, 39.0, 43.0, 42.0, 41.0, 30.0, 35.0, 40.0, 32.0, 26.0, 29.0, 35.0, 27.0, 17.0, 16.0, 22.0, 14.0, 19.0, 12.0, 4.0, 9.0, 7.0, 7.0, 2.0, 7.0, 2.0, 9.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-2.55078125, -2.470794677734375, -2.39080810546875, -2.310821533203125, -2.2308349609375, -2.150848388671875, -2.07086181640625, -1.990875244140625, -1.910888671875, -1.830902099609375, -1.75091552734375, -1.670928955078125, -1.5909423828125, -1.510955810546875, -1.43096923828125, -1.350982666015625, -1.27099609375, -1.191009521484375, -1.11102294921875, -1.031036376953125, -0.9510498046875, -0.871063232421875, -0.79107666015625, -0.711090087890625, -0.631103515625, -0.551116943359375, -0.47113037109375, -0.391143798828125, -0.3111572265625, -0.231170654296875, -0.15118408203125, -0.071197509765625, 0.0087890625, 0.088775634765625, 0.16876220703125, 0.248748779296875, 0.3287353515625, 0.408721923828125, 0.48870849609375, 0.568695068359375, 0.648681640625, 0.728668212890625, 0.80865478515625, 0.888641357421875, 0.9686279296875, 1.048614501953125, 1.12860107421875, 1.208587646484375, 1.28857421875, 1.368560791015625, 1.44854736328125, 1.528533935546875, 1.6085205078125, 1.688507080078125, 1.76849365234375, 1.848480224609375, 1.928466796875, 2.008453369140625, 2.08843994140625, 2.168426513671875, 2.2484130859375, 2.328399658203125, 2.40838623046875, 2.488372802734375, 2.568359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 9.0, 11.0, 17.0, 19.0, 28.0, 41.0, 67.0, 86.0, 121.0, 195.0, 286.0, 418.0, 616.0, 963.0, 1573.0, 2546.0, 4228.0, 7375.0, 13568.0, 26798.0, 59778.0, 350008.0, 460260.0, 60152.0, 26998.0, 13599.0, 7499.0, 4284.0, 2513.0, 1624.0, 916.0, 646.0, 440.0, 260.0, 195.0, 111.0, 95.0, 57.0, 39.0, 33.0, 23.0, 18.0, 13.0, 10.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.92083740234375, -6.6737060546875, -6.42657470703125, -6.179443359375, -5.93231201171875, -5.6851806640625, -5.43804931640625, -5.19091796875, -4.94378662109375, -4.6966552734375, -4.44952392578125, -4.202392578125, -3.95526123046875, -3.7081298828125, -3.46099853515625, -3.2138671875, -2.96673583984375, -2.7196044921875, -2.47247314453125, -2.225341796875, -1.97821044921875, -1.7310791015625, -1.48394775390625, -1.23681640625, -0.98968505859375, -0.7425537109375, -0.49542236328125, -0.248291015625, -0.00115966796875, 0.2459716796875, 0.49310302734375, 0.740234375, 0.98736572265625, 1.2344970703125, 1.48162841796875, 1.728759765625, 1.97589111328125, 2.2230224609375, 2.47015380859375, 2.71728515625, 2.96441650390625, 3.2115478515625, 3.45867919921875, 3.705810546875, 3.95294189453125, 4.2000732421875, 4.44720458984375, 4.6943359375, 4.94146728515625, 5.1885986328125, 5.43572998046875, 5.682861328125, 5.92999267578125, 6.1771240234375, 6.42425537109375, 6.67138671875, 6.91851806640625, 7.1656494140625, 7.41278076171875, 7.659912109375, 7.90704345703125, 8.1541748046875, 8.40130615234375, 8.6484375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 7.0, 13.0, 6.0, 12.0, 20.0, 24.0, 56.0, 69.0, 133.0, 359.0, 107.0, 40.0, 32.0, 31.0, 12.0, 10.0, 14.0, 7.0, 6.0, 4.0, 8.0, 0.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00040841102600097656, -0.00039534643292427063, -0.0003822818398475647, -0.00036921724677085876, -0.00035615265369415283, -0.0003430880606174469, -0.00033002346754074097, -0.00031695887446403503, -0.0003038942813873291, -0.00029082968831062317, -0.00027776509523391724, -0.0002647005021572113, -0.00025163590908050537, -0.00023857131600379944, -0.0002255067229270935, -0.00021244212985038757, -0.00019937753677368164, -0.0001863129436969757, -0.00017324835062026978, -0.00016018375754356384, -0.0001471191644668579, -0.00013405457139015198, -0.00012098997831344604, -0.00010792538523674011, -9.486079216003418e-05, -8.179619908332825e-05, -6.873160600662231e-05, -5.566701292991638e-05, -4.260241985321045e-05, -2.9537826776504517e-05, -1.6473233699798584e-05, -3.4086406230926514e-06, 9.655952453613281e-06, 2.2720545530319214e-05, 3.5785138607025146e-05, 4.884973168373108e-05, 6.191432476043701e-05, 7.497891783714294e-05, 8.804351091384888e-05, 0.00010110810399055481, 0.00011417269706726074, 0.00012723729014396667, 0.0001403018832206726, 0.00015336647629737854, 0.00016643106937408447, 0.0001794956624507904, 0.00019256025552749634, 0.00020562484860420227, 0.0002186894416809082, 0.00023175403475761414, 0.00024481862783432007, 0.000257883220911026, 0.00027094781398773193, 0.00028401240706443787, 0.0002970770001411438, 0.00031014159321784973, 0.00032320618629455566, 0.0003362707793712616, 0.00034933537244796753, 0.00036239996552467346, 0.0003754645586013794, 0.00038852915167808533, 0.00040159374475479126, 0.0004146583378314972, 0.0004277229309082031]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 2.0, 7.0, 20.0, 28.0, 36.0, 50.0, 100.0, 122.0, 181.0, 273.0, 429.0, 625.0, 1006.0, 1654.0, 2813.0, 4927.0, 9743.0, 21011.0, 54201.0, 351684.0, 501318.0, 54789.0, 21479.0, 9746.0, 4879.0, 2824.0, 1646.0, 1001.0, 649.0, 419.0, 301.0, 201.0, 128.0, 85.0, 61.0, 36.0, 25.0, 12.0, 17.0, 6.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.8995361328125, -7.627197265625, -7.3548583984375, -7.08251953125, -6.8101806640625, -6.537841796875, -6.2655029296875, -5.9931640625, -5.7208251953125, -5.448486328125, -5.1761474609375, -4.90380859375, -4.6314697265625, -4.359130859375, -4.0867919921875, -3.814453125, -3.5421142578125, -3.269775390625, -2.9974365234375, -2.72509765625, -2.4527587890625, -2.180419921875, -1.9080810546875, -1.6357421875, -1.3634033203125, -1.091064453125, -0.8187255859375, -0.54638671875, -0.2740478515625, -0.001708984375, 0.2706298828125, 0.54296875, 0.8153076171875, 1.087646484375, 1.3599853515625, 1.63232421875, 1.9046630859375, 2.177001953125, 2.4493408203125, 2.7216796875, 2.9940185546875, 3.266357421875, 3.5386962890625, 3.81103515625, 4.0833740234375, 4.355712890625, 4.6280517578125, 4.900390625, 5.1727294921875, 5.445068359375, 5.7174072265625, 5.98974609375, 6.2620849609375, 6.534423828125, 6.8067626953125, 7.0791015625, 7.3514404296875, 7.623779296875, 7.8961181640625, 8.16845703125, 8.4407958984375, 8.713134765625, 8.9854736328125, 9.2578125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 7.0, 5.0, 10.0, 9.0, 10.0, 21.0, 24.0, 31.0, 33.0, 31.0, 51.0, 44.0, 427.0, 43.0, 52.0, 27.0, 35.0, 24.0, 23.0, 19.0, 14.0, 10.0, 10.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.2892303466796875, -2.224945068359375, -2.1606597900390625, -2.09637451171875, -2.0320892333984375, -1.967803955078125, -1.9035186767578125, -1.8392333984375, -1.7749481201171875, -1.710662841796875, -1.6463775634765625, -1.58209228515625, -1.5178070068359375, -1.453521728515625, -1.3892364501953125, -1.324951171875, -1.2606658935546875, -1.196380615234375, -1.1320953369140625, -1.06781005859375, -1.0035247802734375, -0.939239501953125, -0.8749542236328125, -0.8106689453125, -0.7463836669921875, -0.682098388671875, -0.6178131103515625, -0.55352783203125, -0.4892425537109375, -0.424957275390625, -0.3606719970703125, -0.29638671875, -0.2321014404296875, -0.167816162109375, -0.1035308837890625, -0.03924560546875, 0.0250396728515625, 0.089324951171875, 0.1536102294921875, 0.2178955078125, 0.2821807861328125, 0.346466064453125, 0.4107513427734375, 0.47503662109375, 0.5393218994140625, 0.603607177734375, 0.6678924560546875, 0.732177734375, 0.7964630126953125, 0.860748291015625, 0.9250335693359375, 0.98931884765625, 1.0536041259765625, 1.117889404296875, 1.1821746826171875, 1.2464599609375, 1.3107452392578125, 1.375030517578125, 1.4393157958984375, 1.50360107421875, 1.5678863525390625, 1.632171630859375, 1.6964569091796875, 1.7607421875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 12.0, 11.0, 7.0, 15.0, 26.0, 37.0, 37.0, 60.0, 77.0, 106.0, 160.0, 109.0, 90.0, 53.0, 49.0, 42.0, 15.0, 22.0, 14.0, 12.0, 13.0, 13.0, 6.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.313016414642334, -7.080687046051025, -6.848357677459717, -6.61602783203125, -6.383698463439941, -6.151369094848633, -5.919039726257324, -5.686710357666016, -5.454380989074707, -5.222051620483398, -4.98972225189209, -4.757392883300781, -4.5250630378723145, -4.292733669281006, -4.060404300689697, -3.8280749320983887, -3.595745086669922, -3.3634157180786133, -3.1310861110687256, -2.898756742477417, -2.6664271354675293, -2.4340977668762207, -2.201768398284912, -1.969438910484314, -1.7371094226837158, -1.5047799348831177, -1.2724504470825195, -1.040121078491211, -0.8077915906906128, -0.5754621028900146, -0.34313273429870605, -0.11080324649810791, 0.12152576446533203, 0.3538552224636078, 0.5861846804618835, 0.8185141086578369, 1.050843596458435, 1.2831730842590332, 1.5155024528503418, 1.74783194065094, 1.980161428451538, 2.2124907970428467, 2.4448204040527344, 2.677149772644043, 2.9094791412353516, 3.1418087482452393, 3.374138116836548, 3.6064677238464355, 3.838797092437744, 4.071126461029053, 4.303455829620361, 4.535785675048828, 4.768115043640137, 5.000444412231445, 5.232773780822754, 5.4651031494140625, 5.697432518005371, 5.92976188659668, 6.162091255187988, 6.394420623779297, 6.626750469207764, 6.859079837799072, 7.091409206390381, 7.3237385749816895, 7.556068420410156]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 7.0, 12.0, 10.0, 15.0, 14.0, 18.0, 26.0, 17.0, 24.0, 28.0, 30.0, 32.0, 26.0, 39.0, 40.0, 41.0, 46.0, 47.0, 35.0, 33.0, 31.0, 31.0, 41.0, 31.0, 30.0, 34.0, 34.0, 39.0, 18.0, 21.0, 20.0, 24.0, 21.0, 13.0, 7.0, 10.0, 6.0, 3.0, 11.0, 7.0, 3.0, 0.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.222689628601074, -4.089003562927246, -3.955317258834839, -3.8216309547424316, -3.6879448890686035, -3.5542585849761963, -3.420572280883789, -3.286886215209961, -3.1531999111175537, -3.0195136070251465, -2.8858275413513184, -2.752141237258911, -2.618454933166504, -2.484768867492676, -2.3510825634002686, -2.2173962593078613, -2.083710193634033, -1.9500240087509155, -1.8163378238677979, -1.6826515197753906, -1.548965334892273, -1.4152791500091553, -1.281592845916748, -1.1479066610336304, -1.0142204761505127, -0.880534291267395, -0.7468480467796326, -0.6131618022918701, -0.47947561740875244, -0.34578943252563477, -0.21210318803787231, -0.07841694355010986, 0.055269718170166016, 0.18895593285560608, 0.32264214754104614, 0.4563283622264862, 0.5900145769119263, 0.723700761795044, 0.8573870062828064, 0.9910732507705688, 1.1247594356536865, 1.2584456205368042, 1.3921318054199219, 1.525818109512329, 1.6595042943954468, 1.7931904792785645, 1.9268767833709717, 2.060563087463379, 2.194249153137207, 2.3279354572296143, 2.4616215229034424, 2.5953078269958496, 2.7289938926696777, 2.862680196762085, 2.996366500854492, 3.1300525665283203, 3.2637388706207275, 3.3974251747131348, 3.531111240386963, 3.66479754447937, 3.7984838485717773, 3.9321699142456055, 4.065855979919434, 4.19954252243042, 4.333228588104248]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 3.0, 9.0, 16.0, 30.0, 36.0, 50.0, 55.0, 108.0, 193.0, 288.0, 426.0, 651.0, 1120.0, 1712.0, 2653.0, 4299.0, 7019.0, 11922.0, 21077.0, 38390.0, 74737.0, 161060.0, 458158.0, 1895819.0, 1033590.0, 254763.0, 106453.0, 51978.0, 27885.0, 15592.0, 9166.0, 5650.0, 3505.0, 2185.0, 1350.0, 844.0, 507.0, 331.0, 221.0, 144.0, 80.0, 79.0, 44.0, 36.0, 15.0, 13.0, 5.0, 12.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.57421875, -6.353271484375, -6.13232421875, -5.911376953125, -5.6904296875, -5.469482421875, -5.24853515625, -5.027587890625, -4.806640625, -4.585693359375, -4.36474609375, -4.143798828125, -3.9228515625, -3.701904296875, -3.48095703125, -3.260009765625, -3.0390625, -2.818115234375, -2.59716796875, -2.376220703125, -2.1552734375, -1.934326171875, -1.71337890625, -1.492431640625, -1.271484375, -1.050537109375, -0.82958984375, -0.608642578125, -0.3876953125, -0.166748046875, 0.05419921875, 0.275146484375, 0.49609375, 0.717041015625, 0.93798828125, 1.158935546875, 1.3798828125, 1.600830078125, 1.82177734375, 2.042724609375, 2.263671875, 2.484619140625, 2.70556640625, 2.926513671875, 3.1474609375, 3.368408203125, 3.58935546875, 3.810302734375, 4.03125, 4.252197265625, 4.47314453125, 4.694091796875, 4.9150390625, 5.135986328125, 5.35693359375, 5.577880859375, 5.798828125, 6.019775390625, 6.24072265625, 6.461669921875, 6.6826171875, 6.903564453125, 7.12451171875, 7.345458984375, 7.56640625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 11.0, 7.0, 7.0, 5.0, 13.0, 9.0, 10.0, 21.0, 18.0, 23.0, 17.0, 22.0, 27.0, 35.0, 33.0, 39.0, 26.0, 40.0, 52.0, 48.0, 48.0, 34.0, 37.0, 40.0, 31.0, 47.0, 33.0, 42.0, 23.0, 22.0, 34.0, 27.0, 27.0, 19.0, 15.0, 11.0, 8.0, 10.0, 8.0, 4.0, 6.0, 4.0, 5.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.955413818359375, -2.86590576171875, -2.776397705078125, -2.6868896484375, -2.597381591796875, -2.50787353515625, -2.418365478515625, -2.328857421875, -2.239349365234375, -2.14984130859375, -2.060333251953125, -1.9708251953125, -1.881317138671875, -1.79180908203125, -1.702301025390625, -1.61279296875, -1.523284912109375, -1.43377685546875, -1.344268798828125, -1.2547607421875, -1.165252685546875, -1.07574462890625, -0.986236572265625, -0.896728515625, -0.807220458984375, -0.71771240234375, -0.628204345703125, -0.5386962890625, -0.449188232421875, -0.35968017578125, -0.270172119140625, -0.1806640625, -0.091156005859375, -0.00164794921875, 0.087860107421875, 0.1773681640625, 0.266876220703125, 0.35638427734375, 0.445892333984375, 0.535400390625, 0.624908447265625, 0.71441650390625, 0.803924560546875, 0.8934326171875, 0.982940673828125, 1.07244873046875, 1.161956787109375, 1.25146484375, 1.340972900390625, 1.43048095703125, 1.519989013671875, 1.6094970703125, 1.699005126953125, 1.78851318359375, 1.878021240234375, 1.967529296875, 2.057037353515625, 2.14654541015625, 2.236053466796875, 2.3255615234375, 2.415069580078125, 2.50457763671875, 2.594085693359375, 2.68359375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 7.0, 14.0, 17.0, 28.0, 42.0, 61.0, 85.0, 152.0, 231.0, 389.0, 603.0, 993.0, 1617.0, 2676.0, 4564.0, 8038.0, 13928.0, 25192.0, 47966.0, 94017.0, 202780.0, 528468.0, 1662498.0, 987569.0, 326154.0, 138630.0, 67521.0, 34925.0, 19318.0, 10753.0, 6011.0, 3460.0, 2099.0, 1336.0, 781.0, 461.0, 327.0, 180.0, 125.0, 96.0, 63.0, 36.0, 28.0, 18.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75390625, -5.57275390625, -5.3916015625, -5.21044921875, -5.029296875, -4.84814453125, -4.6669921875, -4.48583984375, -4.3046875, -4.12353515625, -3.9423828125, -3.76123046875, -3.580078125, -3.39892578125, -3.2177734375, -3.03662109375, -2.85546875, -2.67431640625, -2.4931640625, -2.31201171875, -2.130859375, -1.94970703125, -1.7685546875, -1.58740234375, -1.40625, -1.22509765625, -1.0439453125, -0.86279296875, -0.681640625, -0.50048828125, -0.3193359375, -0.13818359375, 0.04296875, 0.22412109375, 0.4052734375, 0.58642578125, 0.767578125, 0.94873046875, 1.1298828125, 1.31103515625, 1.4921875, 1.67333984375, 1.8544921875, 2.03564453125, 2.216796875, 2.39794921875, 2.5791015625, 2.76025390625, 2.94140625, 3.12255859375, 3.3037109375, 3.48486328125, 3.666015625, 3.84716796875, 4.0283203125, 4.20947265625, 4.390625, 4.57177734375, 4.7529296875, 4.93408203125, 5.115234375, 5.29638671875, 5.4775390625, 5.65869140625, 5.83984375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 11.0, 8.0, 16.0, 20.0, 23.0, 17.0, 26.0, 37.0, 64.0, 54.0, 66.0, 106.0, 108.0, 115.0, 154.0, 172.0, 207.0, 231.0, 285.0, 298.0, 315.0, 273.0, 230.0, 210.0, 180.0, 150.0, 129.0, 108.0, 89.0, 71.0, 71.0, 58.0, 38.0, 21.0, 26.0, 18.0, 12.0, 14.0, 10.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.6162109375, -1.56878662109375, -1.5213623046875, -1.47393798828125, -1.426513671875, -1.37908935546875, -1.3316650390625, -1.28424072265625, -1.23681640625, -1.18939208984375, -1.1419677734375, -1.09454345703125, -1.047119140625, -0.99969482421875, -0.9522705078125, -0.90484619140625, -0.857421875, -0.80999755859375, -0.7625732421875, -0.71514892578125, -0.667724609375, -0.62030029296875, -0.5728759765625, -0.52545166015625, -0.47802734375, -0.43060302734375, -0.3831787109375, -0.33575439453125, -0.288330078125, -0.24090576171875, -0.1934814453125, -0.14605712890625, -0.0986328125, -0.05120849609375, -0.0037841796875, 0.04364013671875, 0.091064453125, 0.13848876953125, 0.1859130859375, 0.23333740234375, 0.28076171875, 0.32818603515625, 0.3756103515625, 0.42303466796875, 0.470458984375, 0.51788330078125, 0.5653076171875, 0.61273193359375, 0.66015625, 0.70758056640625, 0.7550048828125, 0.80242919921875, 0.849853515625, 0.89727783203125, 0.9447021484375, 0.99212646484375, 1.03955078125, 1.08697509765625, 1.1343994140625, 1.18182373046875, 1.229248046875, 1.27667236328125, 1.3240966796875, 1.37152099609375, 1.4189453125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 8.0, 11.0, 15.0, 20.0, 30.0, 56.0, 57.0, 119.0, 161.0, 163.0, 123.0, 79.0, 61.0, 24.0, 17.0, 11.0, 12.0, 10.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.28921890258789, -10.060796737670898, -9.832375526428223, -9.60395336151123, -9.375531196594238, -9.147109985351562, -8.91868782043457, -8.690265655517578, -8.461844444274902, -8.23342227935791, -8.005001068115234, -7.776578903198242, -7.548157215118408, -7.319735050201416, -7.091313362121582, -6.86289119720459, -6.634469032287598, -6.406047344207764, -6.1776251792907715, -5.9492034912109375, -5.7207818031311035, -5.492359638214111, -5.263937950134277, -5.035515785217285, -4.807094573974609, -4.578672885894775, -4.350250720977783, -4.121829032897949, -3.893407106399536, -3.664985179901123, -3.436563491821289, -3.208141565322876, -2.979719638824463, -2.75129771232605, -2.522876024246216, -2.2944540977478027, -2.0660321712493896, -1.8376103639602661, -1.6091885566711426, -1.3807666301727295, -1.152344822883606, -0.9239229559898376, -0.6955010890960693, -0.4670792818069458, -0.2386574149131775, -0.01023554801940918, 0.21818625926971436, 0.44660818576812744, 0.675029993057251, 0.9034518599510193, 1.1318737268447876, 1.3602955341339111, 1.5887174606323242, 1.8171392679214478, 2.0455610752105713, 2.2739830017089844, 2.5024046897888184, 2.7308266162872314, 2.9592483043670654, 3.1876702308654785, 3.4160921573638916, 3.6445140838623047, 3.8729357719421387, 4.101357460021973, 4.329779624938965]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 7.0, 3.0, 8.0, 3.0, 9.0, 7.0, 13.0, 16.0, 26.0, 13.0, 15.0, 22.0, 22.0, 27.0, 27.0, 37.0, 37.0, 30.0, 29.0, 36.0, 37.0, 37.0, 37.0, 40.0, 28.0, 34.0, 37.0, 42.0, 37.0, 38.0, 24.0, 29.0, 28.0, 21.0, 20.0, 24.0, 11.0, 25.0, 9.0, 13.0, 6.0, 12.0, 7.0, 9.0, 5.0, 2.0, 2.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.9738423824310303, -2.881728172302246, -2.789613723754883, -2.6974992752075195, -2.6053850650787354, -2.513270854949951, -2.421156406402588, -2.3290419578552246, -2.2369277477264404, -2.1448135375976562, -2.052699089050293, -1.9605847597122192, -1.8684704303741455, -1.7763561010360718, -1.684241771697998, -1.5921274423599243, -1.5000131130218506, -1.4078987836837769, -1.3157844543457031, -1.2236701250076294, -1.1315557956695557, -1.039441466331482, -0.9473271369934082, -0.8552128076553345, -0.7630984783172607, -0.670984148979187, -0.5788698196411133, -0.48675549030303955, -0.3946411609649658, -0.3025268316268921, -0.21041250228881836, -0.11829817295074463, -0.026183605194091797, 0.06593072414398193, 0.15804505348205566, 0.2501593828201294, 0.3422737121582031, 0.43438804149627686, 0.5265023708343506, 0.6186167001724243, 0.710731029510498, 0.8028453588485718, 0.8949596881866455, 0.9870740175247192, 1.079188346862793, 1.1713026762008667, 1.2634170055389404, 1.3555313348770142, 1.447645664215088, 1.5397599935531616, 1.6318743228912354, 1.723988652229309, 1.8161029815673828, 1.9082173109054565, 2.0003316402435303, 2.0924458503723145, 2.1845602989196777, 2.276674747467041, 2.368788957595825, 2.4609031677246094, 2.5530176162719727, 2.645132064819336, 2.73724627494812, 2.8293604850769043, 2.9214749336242676]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 19.0, 19.0, 18.0, 41.0, 56.0, 72.0, 122.0, 140.0, 225.0, 307.0, 398.0, 577.0, 802.0, 1187.0, 1672.0, 2479.0, 3800.0, 6116.0, 10191.0, 17767.0, 33658.0, 70289.0, 171238.0, 380034.0, 187022.0, 76381.0, 35636.0, 18798.0, 10652.0, 6282.0, 4072.0, 2635.0, 1740.0, 1182.0, 838.0, 622.0, 365.0, 306.0, 233.0, 154.0, 112.0, 88.0, 61.0, 47.0, 37.0, 19.0, 11.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.3564453125, -1.313446044921875, -1.27044677734375, -1.227447509765625, -1.1844482421875, -1.141448974609375, -1.09844970703125, -1.055450439453125, -1.012451171875, -0.969451904296875, -0.92645263671875, -0.883453369140625, -0.8404541015625, -0.797454833984375, -0.75445556640625, -0.711456298828125, -0.66845703125, -0.625457763671875, -0.58245849609375, -0.539459228515625, -0.4964599609375, -0.453460693359375, -0.41046142578125, -0.367462158203125, -0.324462890625, -0.281463623046875, -0.23846435546875, -0.195465087890625, -0.1524658203125, -0.109466552734375, -0.06646728515625, -0.023468017578125, 0.01953125, 0.062530517578125, 0.10552978515625, 0.148529052734375, 0.1915283203125, 0.234527587890625, 0.27752685546875, 0.320526123046875, 0.363525390625, 0.406524658203125, 0.44952392578125, 0.492523193359375, 0.5355224609375, 0.578521728515625, 0.62152099609375, 0.664520263671875, 0.70751953125, 0.750518798828125, 0.79351806640625, 0.836517333984375, 0.8795166015625, 0.922515869140625, 0.96551513671875, 1.008514404296875, 1.051513671875, 1.094512939453125, 1.13751220703125, 1.180511474609375, 1.2235107421875, 1.266510009765625, 1.30950927734375, 1.352508544921875, 1.3955078125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 11.0, 9.0, 16.0, 16.0, 13.0, 12.0, 25.0, 29.0, 39.0, 25.0, 34.0, 39.0, 35.0, 35.0, 34.0, 34.0, 41.0, 45.0, 37.0, 36.0, 43.0, 35.0, 42.0, 41.0, 41.0, 35.0, 31.0, 25.0, 17.0, 21.0, 17.0, 12.0, 21.0, 7.0, 9.0, 9.0, 8.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.33203125, -3.2281494140625, -3.124267578125, -3.0203857421875, -2.91650390625, -2.8126220703125, -2.708740234375, -2.6048583984375, -2.5009765625, -2.3970947265625, -2.293212890625, -2.1893310546875, -2.08544921875, -1.9815673828125, -1.877685546875, -1.7738037109375, -1.669921875, -1.5660400390625, -1.462158203125, -1.3582763671875, -1.25439453125, -1.1505126953125, -1.046630859375, -0.9427490234375, -0.8388671875, -0.7349853515625, -0.631103515625, -0.5272216796875, -0.42333984375, -0.3194580078125, -0.215576171875, -0.1116943359375, -0.0078125, 0.0960693359375, 0.199951171875, 0.3038330078125, 0.40771484375, 0.5115966796875, 0.615478515625, 0.7193603515625, 0.8232421875, 0.9271240234375, 1.031005859375, 1.1348876953125, 1.23876953125, 1.3426513671875, 1.446533203125, 1.5504150390625, 1.654296875, 1.7581787109375, 1.862060546875, 1.9659423828125, 2.06982421875, 2.1737060546875, 2.277587890625, 2.3814697265625, 2.4853515625, 2.5892333984375, 2.693115234375, 2.7969970703125, 2.90087890625, 3.0047607421875, 3.108642578125, 3.2125244140625, 3.31640625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 11.0, 17.0, 27.0, 41.0, 67.0, 78.0, 105.0, 166.0, 236.0, 352.0, 545.0, 776.0, 1226.0, 2108.0, 3462.0, 6302.0, 12073.0, 26253.0, 64963.0, 221436.0, 497208.0, 126829.0, 43705.0, 18850.0, 9223.0, 4937.0, 2807.0, 1641.0, 1015.0, 705.0, 421.0, 293.0, 208.0, 152.0, 70.0, 53.0, 54.0, 34.0, 25.0, 9.0, 18.0, 12.0, 13.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.28515625, -2.2204132080078125, -2.155670166015625, -2.0909271240234375, -2.02618408203125, -1.9614410400390625, -1.896697998046875, -1.8319549560546875, -1.7672119140625, -1.7024688720703125, -1.637725830078125, -1.5729827880859375, -1.50823974609375, -1.4434967041015625, -1.378753662109375, -1.3140106201171875, -1.249267578125, -1.1845245361328125, -1.119781494140625, -1.0550384521484375, -0.99029541015625, -0.9255523681640625, -0.860809326171875, -0.7960662841796875, -0.7313232421875, -0.6665802001953125, -0.601837158203125, -0.5370941162109375, -0.47235107421875, -0.4076080322265625, -0.342864990234375, -0.2781219482421875, -0.21337890625, -0.1486358642578125, -0.083892822265625, -0.0191497802734375, 0.04559326171875, 0.1103363037109375, 0.175079345703125, 0.2398223876953125, 0.3045654296875, 0.3693084716796875, 0.434051513671875, 0.4987945556640625, 0.56353759765625, 0.6282806396484375, 0.693023681640625, 0.7577667236328125, 0.822509765625, 0.8872528076171875, 0.951995849609375, 1.0167388916015625, 1.08148193359375, 1.1462249755859375, 1.210968017578125, 1.2757110595703125, 1.3404541015625, 1.4051971435546875, 1.469940185546875, 1.5346832275390625, 1.59942626953125, 1.6641693115234375, 1.728912353515625, 1.7936553955078125, 1.8583984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 4.0, 6.0, 11.0, 7.0, 7.0, 15.0, 24.0, 15.0, 10.0, 26.0, 29.0, 29.0, 26.0, 29.0, 38.0, 46.0, 46.0, 46.0, 48.0, 45.0, 29.0, 37.0, 51.0, 42.0, 27.0, 44.0, 40.0, 19.0, 35.0, 32.0, 25.0, 16.0, 10.0, 20.0, 15.0, 17.0, 5.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.041015625, -1.972808837890625, -1.90460205078125, -1.836395263671875, -1.7681884765625, -1.699981689453125, -1.63177490234375, -1.563568115234375, -1.495361328125, -1.427154541015625, -1.35894775390625, -1.290740966796875, -1.2225341796875, -1.154327392578125, -1.08612060546875, -1.017913818359375, -0.94970703125, -0.881500244140625, -0.81329345703125, -0.745086669921875, -0.6768798828125, -0.608673095703125, -0.54046630859375, -0.472259521484375, -0.404052734375, -0.335845947265625, -0.26763916015625, -0.199432373046875, -0.1312255859375, -0.063018798828125, 0.00518798828125, 0.073394775390625, 0.1416015625, 0.209808349609375, 0.27801513671875, 0.346221923828125, 0.4144287109375, 0.482635498046875, 0.55084228515625, 0.619049072265625, 0.687255859375, 0.755462646484375, 0.82366943359375, 0.891876220703125, 0.9600830078125, 1.028289794921875, 1.09649658203125, 1.164703369140625, 1.23291015625, 1.301116943359375, 1.36932373046875, 1.437530517578125, 1.5057373046875, 1.573944091796875, 1.64215087890625, 1.710357666015625, 1.778564453125, 1.846771240234375, 1.91497802734375, 1.983184814453125, 2.0513916015625, 2.119598388671875, 2.18780517578125, 2.256011962890625, 2.32421875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 10.0, 12.0, 12.0, 15.0, 22.0, 32.0, 43.0, 72.0, 86.0, 140.0, 191.0, 326.0, 567.0, 844.0, 1452.0, 2456.0, 4055.0, 7812.0, 16658.0, 42437.0, 161210.0, 629142.0, 116219.0, 34351.0, 14281.0, 6803.0, 3703.0, 2089.0, 1261.0, 745.0, 488.0, 352.0, 208.0, 141.0, 102.0, 74.0, 37.0, 27.0, 24.0, 17.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.31689453125, -0.3076820373535156, -0.29846954345703125, -0.2892570495605469, -0.2800445556640625, -0.2708320617675781, -0.26161956787109375, -0.2524070739746094, -0.243194580078125, -0.23398208618164062, -0.22476959228515625, -0.21555709838867188, -0.2063446044921875, -0.19713211059570312, -0.18791961669921875, -0.17870712280273438, -0.16949462890625, -0.16028213500976562, -0.15106964111328125, -0.14185714721679688, -0.1326446533203125, -0.12343215942382812, -0.11421966552734375, -0.10500717163085938, -0.095794677734375, -0.08658218383789062, -0.07736968994140625, -0.06815719604492188, -0.0589447021484375, -0.049732208251953125, -0.04051971435546875, -0.031307220458984375, -0.0220947265625, -0.012882232666015625, -0.00366973876953125, 0.005542755126953125, 0.0147552490234375, 0.023967742919921875, 0.03318023681640625, 0.042392730712890625, 0.051605224609375, 0.060817718505859375, 0.07003021240234375, 0.07924270629882812, 0.0884552001953125, 0.09766769409179688, 0.10688018798828125, 0.11609268188476562, 0.12530517578125, 0.13451766967773438, 0.14373016357421875, 0.15294265747070312, 0.1621551513671875, 0.17136764526367188, 0.18058013916015625, 0.18979263305664062, 0.199005126953125, 0.20821762084960938, 0.21743011474609375, 0.22664260864257812, 0.2358551025390625, 0.24506759643554688, 0.25428009033203125, 0.2634925842285156, 0.272705078125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 12.0, 9.0, 14.0, 19.0, 40.0, 37.0, 53.0, 102.0, 145.0, 183.0, 121.0, 79.0, 36.0, 39.0, 24.0, 20.0, 9.0, 8.0, 7.0, 8.0, 3.0, 1.0, 3.0, 7.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6345252990722656e-05, -2.5527551770210266e-05, -2.4709850549697876e-05, -2.3892149329185486e-05, -2.3074448108673096e-05, -2.2256746888160706e-05, -2.1439045667648315e-05, -2.0621344447135925e-05, -1.9803643226623535e-05, -1.8985942006111145e-05, -1.8168240785598755e-05, -1.7350539565086365e-05, -1.6532838344573975e-05, -1.5715137124061584e-05, -1.4897435903549194e-05, -1.4079734683036804e-05, -1.3262033462524414e-05, -1.2444332242012024e-05, -1.1626631021499634e-05, -1.0808929800987244e-05, -9.991228580474854e-06, -9.173527359962463e-06, -8.355826139450073e-06, -7.538124918937683e-06, -6.720423698425293e-06, -5.902722477912903e-06, -5.085021257400513e-06, -4.2673200368881226e-06, -3.4496188163757324e-06, -2.6319175958633423e-06, -1.8142163753509521e-06, -9.96515154838562e-07, -1.7881393432617188e-07, 6.388872861862183e-07, 1.4565885066986084e-06, 2.2742897272109985e-06, 3.0919909477233887e-06, 3.909692168235779e-06, 4.727393388748169e-06, 5.545094609260559e-06, 6.362795829772949e-06, 7.180497050285339e-06, 7.99819827079773e-06, 8.81589949131012e-06, 9.63360071182251e-06, 1.04513019323349e-05, 1.126900315284729e-05, 1.208670437335968e-05, 1.290440559387207e-05, 1.372210681438446e-05, 1.453980803489685e-05, 1.535750925540924e-05, 1.617521047592163e-05, 1.699291169643402e-05, 1.781061291694641e-05, 1.86283141374588e-05, 1.944601535797119e-05, 2.026371657848358e-05, 2.108141779899597e-05, 2.1899119019508362e-05, 2.2716820240020752e-05, 2.3534521460533142e-05, 2.4352222681045532e-05, 2.5169923901557922e-05, 2.5987625122070312e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 6.0, 7.0, 4.0, 11.0, 18.0, 30.0, 49.0, 71.0, 106.0, 164.0, 273.0, 483.0, 851.0, 1541.0, 2861.0, 5088.0, 9396.0, 17886.0, 37907.0, 98532.0, 522097.0, 227614.0, 65312.0, 27989.0, 13662.0, 7371.0, 4082.0, 2188.0, 1212.0, 698.0, 440.0, 238.0, 128.0, 80.0, 53.0, 41.0, 22.0, 13.0, 11.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5078125, -0.49279022216796875, -0.4777679443359375, -0.46274566650390625, -0.447723388671875, -0.43270111083984375, -0.4176788330078125, -0.40265655517578125, -0.38763427734375, -0.37261199951171875, -0.3575897216796875, -0.34256744384765625, -0.327545166015625, -0.31252288818359375, -0.2975006103515625, -0.28247833251953125, -0.2674560546875, -0.25243377685546875, -0.2374114990234375, -0.22238922119140625, -0.207366943359375, -0.19234466552734375, -0.1773223876953125, -0.16230010986328125, -0.14727783203125, -0.13225555419921875, -0.1172332763671875, -0.10221099853515625, -0.087188720703125, -0.07216644287109375, -0.0571441650390625, -0.04212188720703125, -0.027099609375, -0.01207733154296875, 0.0029449462890625, 0.01796722412109375, 0.032989501953125, 0.04801177978515625, 0.0630340576171875, 0.07805633544921875, 0.09307861328125, 0.10810089111328125, 0.1231231689453125, 0.13814544677734375, 0.153167724609375, 0.16819000244140625, 0.1832122802734375, 0.19823455810546875, 0.2132568359375, 0.22827911376953125, 0.2433013916015625, 0.25832366943359375, 0.273345947265625, 0.28836822509765625, 0.3033905029296875, 0.31841278076171875, 0.33343505859375, 0.34845733642578125, 0.3634796142578125, 0.37850189208984375, 0.393524169921875, 0.40854644775390625, 0.4235687255859375, 0.43859100341796875, 0.45361328125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 1.0, 4.0, 9.0, 9.0, 12.0, 7.0, 12.0, 6.0, 9.0, 20.0, 19.0, 28.0, 35.0, 32.0, 41.0, 43.0, 42.0, 64.0, 77.0, 87.0, 91.0, 65.0, 38.0, 45.0, 31.0, 40.0, 9.0, 18.0, 19.0, 21.0, 15.0, 17.0, 10.0, 8.0, 7.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08380126953125, -0.08025455474853516, -0.07670783996582031, -0.07316112518310547, -0.06961441040039062, -0.06606769561767578, -0.06252098083496094, -0.058974266052246094, -0.05542755126953125, -0.051880836486816406, -0.04833412170410156, -0.04478740692138672, -0.041240692138671875, -0.03769397735595703, -0.03414726257324219, -0.030600547790527344, -0.0270538330078125, -0.023507118225097656, -0.019960403442382812, -0.01641368865966797, -0.012866973876953125, -0.009320259094238281, -0.0057735443115234375, -0.0022268295288085938, 0.00131988525390625, 0.004866600036621094, 0.008413314819335938, 0.011960029602050781, 0.015506744384765625, 0.01905345916748047, 0.022600173950195312, 0.026146888732910156, 0.029693603515625, 0.033240318298339844, 0.03678703308105469, 0.04033374786376953, 0.043880462646484375, 0.04742717742919922, 0.05097389221191406, 0.054520606994628906, 0.05806732177734375, 0.061614036560058594, 0.06516075134277344, 0.06870746612548828, 0.07225418090820312, 0.07580089569091797, 0.07934761047363281, 0.08289432525634766, 0.0864410400390625, 0.08998775482177734, 0.09353446960449219, 0.09708118438720703, 0.10062789916992188, 0.10417461395263672, 0.10772132873535156, 0.1112680435180664, 0.11481475830078125, 0.1183614730834961, 0.12190818786621094, 0.12545490264892578, 0.12900161743164062, 0.13254833221435547, 0.1360950469970703, 0.13964176177978516, 0.1431884765625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 12.0, 24.0, 26.0, 56.0, 46.0, 102.0, 149.0, 153.0, 154.0, 79.0, 64.0, 39.0, 17.0, 17.0, 13.0, 8.0, 7.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.93741512298584, -9.71297550201416, -9.48853588104248, -9.2640962600708, -9.039657592773438, -8.815217971801758, -8.590778350830078, -8.366338729858398, -8.141899108886719, -7.917459487915039, -7.693020343780518, -7.468580722808838, -7.244141101837158, -7.019701957702637, -6.795262336730957, -6.570822715759277, -6.346383094787598, -6.121943473815918, -5.8975043296813965, -5.673064708709717, -5.448625087738037, -5.224185943603516, -4.999746322631836, -4.775306701660156, -4.550867557525635, -4.326427936553955, -4.101988792419434, -3.877549171447754, -3.653109550476074, -3.4286701679229736, -3.204230785369873, -2.9797911643981934, -2.7553515434265137, -2.530912160873413, -2.3064725399017334, -2.082033157348633, -1.8575935363769531, -1.6331541538238525, -1.4087146520614624, -1.1842751502990723, -0.9598356485366821, -0.735396146774292, -0.5109566450119019, -0.2865172028541565, -0.06207770109176636, 0.162361741065979, 0.38680124282836914, 0.6112407445907593, 0.8356802463531494, 1.0601197481155396, 1.2845592498779297, 1.5089986324310303, 1.73343825340271, 1.9578776359558105, 2.1823172569274902, 2.406756639480591, 2.6311960220336914, 2.855635404586792, 3.0800750255584717, 3.3045144081115723, 3.528954029083252, 3.7533934116363525, 3.977832794189453, 4.202272415161133, 4.4267120361328125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 5.0, 6.0, 5.0, 8.0, 10.0, 9.0, 25.0, 22.0, 12.0, 18.0, 19.0, 23.0, 24.0, 32.0, 39.0, 33.0, 25.0, 35.0, 34.0, 38.0, 38.0, 41.0, 37.0, 28.0, 36.0, 38.0, 41.0, 36.0, 33.0, 28.0, 26.0, 30.0, 21.0, 23.0, 17.0, 16.0, 20.0, 13.0, 10.0, 7.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-2.96915602684021, -2.8762667179107666, -2.7833776473999023, -2.690488338470459, -2.5975990295410156, -2.5047097206115723, -2.411820411682129, -2.3189313411712646, -2.2260420322418213, -2.133152723312378, -2.0402636528015137, -1.9473743438720703, -1.854485034942627, -1.7615957260131836, -1.6687065362930298, -1.575817346572876, -1.4829280376434326, -1.3900387287139893, -1.2971495389938354, -1.2042603492736816, -1.1113710403442383, -1.018481731414795, -0.9255925416946411, -0.8327032923698425, -0.739814043045044, -0.6469247937202454, -0.5540355443954468, -0.4611462950706482, -0.3682570457458496, -0.275367796421051, -0.18247854709625244, -0.08958929777145386, 0.0032999515533447266, 0.09618920087814331, 0.1890784502029419, 0.2819676995277405, 0.37485694885253906, 0.46774619817733765, 0.5606354475021362, 0.6535246968269348, 0.7464139461517334, 0.839303195476532, 0.9321924448013306, 1.0250816345214844, 1.1179709434509277, 1.210860252380371, 1.303749442100525, 1.3966386318206787, 1.489527940750122, 1.5824172496795654, 1.6753064393997192, 1.768195629119873, 1.8610849380493164, 1.9539742469787598, 2.046863555908203, 2.1397526264190674, 2.2326419353485107, 2.325531244277954, 2.4184203147888184, 2.5113096237182617, 2.604198932647705, 2.6970882415771484, 2.789977550506592, 2.882866621017456, 2.9757559299468994]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 5.0, 7.0, 9.0, 16.0, 16.0, 19.0, 39.0, 53.0, 74.0, 106.0, 154.0, 258.0, 380.0, 559.0, 840.0, 1461.0, 2319.0, 3978.0, 6399.0, 11088.0, 19981.0, 36410.0, 68311.0, 134439.0, 253993.0, 240224.0, 124301.0, 64016.0, 33912.0, 18593.0, 10594.0, 6149.0, 3692.0, 2280.0, 1359.0, 853.0, 548.0, 373.0, 255.0, 156.0, 112.0, 75.0, 55.0, 34.0, 20.0, 9.0, 16.0, 7.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0], "bins": [-6.234375, -6.05596923828125, -5.8775634765625, -5.69915771484375, -5.520751953125, -5.34234619140625, -5.1639404296875, -4.98553466796875, -4.80712890625, -4.62872314453125, -4.4503173828125, -4.27191162109375, -4.093505859375, -3.91510009765625, -3.7366943359375, -3.55828857421875, -3.3798828125, -3.20147705078125, -3.0230712890625, -2.84466552734375, -2.666259765625, -2.48785400390625, -2.3094482421875, -2.13104248046875, -1.95263671875, -1.77423095703125, -1.5958251953125, -1.41741943359375, -1.239013671875, -1.06060791015625, -0.8822021484375, -0.70379638671875, -0.525390625, -0.34698486328125, -0.1685791015625, 0.00982666015625, 0.188232421875, 0.36663818359375, 0.5450439453125, 0.72344970703125, 0.90185546875, 1.08026123046875, 1.2586669921875, 1.43707275390625, 1.615478515625, 1.79388427734375, 1.9722900390625, 2.15069580078125, 2.3291015625, 2.50750732421875, 2.6859130859375, 2.86431884765625, 3.042724609375, 3.22113037109375, 3.3995361328125, 3.57794189453125, 3.75634765625, 3.93475341796875, 4.1131591796875, 4.29156494140625, 4.469970703125, 4.64837646484375, 4.8267822265625, 5.00518798828125, 5.18359375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 12.0, 6.0, 6.0, 12.0, 11.0, 21.0, 15.0, 19.0, 21.0, 21.0, 30.0, 32.0, 48.0, 29.0, 46.0, 44.0, 44.0, 36.0, 35.0, 44.0, 44.0, 36.0, 41.0, 49.0, 37.0, 46.0, 24.0, 32.0, 25.0, 14.0, 22.0, 18.0, 22.0, 11.0, 9.0, 8.0, 9.0, 5.0, 4.0, 5.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0, -2.903656005859375, -2.80731201171875, -2.710968017578125, -2.6146240234375, -2.518280029296875, -2.42193603515625, -2.325592041015625, -2.229248046875, -2.132904052734375, -2.03656005859375, -1.940216064453125, -1.8438720703125, -1.747528076171875, -1.65118408203125, -1.554840087890625, -1.45849609375, -1.362152099609375, -1.26580810546875, -1.169464111328125, -1.0731201171875, -0.976776123046875, -0.88043212890625, -0.784088134765625, -0.687744140625, -0.591400146484375, -0.49505615234375, -0.398712158203125, -0.3023681640625, -0.206024169921875, -0.10968017578125, -0.013336181640625, 0.0830078125, 0.179351806640625, 0.27569580078125, 0.372039794921875, 0.4683837890625, 0.564727783203125, 0.66107177734375, 0.757415771484375, 0.853759765625, 0.950103759765625, 1.04644775390625, 1.142791748046875, 1.2391357421875, 1.335479736328125, 1.43182373046875, 1.528167724609375, 1.62451171875, 1.720855712890625, 1.81719970703125, 1.913543701171875, 2.0098876953125, 2.106231689453125, 2.20257568359375, 2.298919677734375, 2.395263671875, 2.491607666015625, 2.58795166015625, 2.684295654296875, 2.7806396484375, 2.876983642578125, 2.97332763671875, 3.069671630859375, 3.166015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 10.0, 5.0, 10.0, 12.0, 31.0, 46.0, 33.0, 60.0, 82.0, 138.0, 226.0, 298.0, 454.0, 628.0, 989.0, 1676.0, 2658.0, 4356.0, 7040.0, 11881.0, 20227.0, 35476.0, 61724.0, 110974.0, 200818.0, 249800.0, 146743.0, 81062.0, 46098.0, 26206.0, 15211.0, 8928.0, 5489.0, 3335.0, 2000.0, 1326.0, 836.0, 571.0, 321.0, 252.0, 180.0, 105.0, 72.0, 56.0, 30.0, 24.0, 18.0, 14.0, 12.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0], "bins": [-5.203125, -5.04656982421875, -4.8900146484375, -4.73345947265625, -4.576904296875, -4.42034912109375, -4.2637939453125, -4.10723876953125, -3.95068359375, -3.79412841796875, -3.6375732421875, -3.48101806640625, -3.324462890625, -3.16790771484375, -3.0113525390625, -2.85479736328125, -2.6982421875, -2.54168701171875, -2.3851318359375, -2.22857666015625, -2.072021484375, -1.91546630859375, -1.7589111328125, -1.60235595703125, -1.44580078125, -1.28924560546875, -1.1326904296875, -0.97613525390625, -0.819580078125, -0.66302490234375, -0.5064697265625, -0.34991455078125, -0.193359375, -0.03680419921875, 0.1197509765625, 0.27630615234375, 0.432861328125, 0.58941650390625, 0.7459716796875, 0.90252685546875, 1.05908203125, 1.21563720703125, 1.3721923828125, 1.52874755859375, 1.685302734375, 1.84185791015625, 1.9984130859375, 2.15496826171875, 2.3115234375, 2.46807861328125, 2.6246337890625, 2.78118896484375, 2.937744140625, 3.09429931640625, 3.2508544921875, 3.40740966796875, 3.56396484375, 3.72052001953125, 3.8770751953125, 4.03363037109375, 4.190185546875, 4.34674072265625, 4.5032958984375, 4.65985107421875, 4.81640625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 11.0, 8.0, 9.0, 6.0, 10.0, 11.0, 7.0, 19.0, 32.0, 23.0, 18.0, 20.0, 34.0, 26.0, 38.0, 31.0, 38.0, 26.0, 42.0, 33.0, 49.0, 42.0, 30.0, 35.0, 45.0, 28.0, 33.0, 34.0, 36.0, 27.0, 37.0, 22.0, 15.0, 24.0, 22.0, 12.0, 8.0, 8.0, 8.0, 10.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0], "bins": [-1.79296875, -1.7382965087890625, -1.683624267578125, -1.6289520263671875, -1.57427978515625, -1.5196075439453125, -1.464935302734375, -1.4102630615234375, -1.3555908203125, -1.3009185791015625, -1.246246337890625, -1.1915740966796875, -1.13690185546875, -1.0822296142578125, -1.027557373046875, -0.9728851318359375, -0.918212890625, -0.8635406494140625, -0.808868408203125, -0.7541961669921875, -0.69952392578125, -0.6448516845703125, -0.590179443359375, -0.5355072021484375, -0.4808349609375, -0.4261627197265625, -0.371490478515625, -0.3168182373046875, -0.26214599609375, -0.2074737548828125, -0.152801513671875, -0.0981292724609375, -0.04345703125, 0.0112152099609375, 0.065887451171875, 0.1205596923828125, 0.17523193359375, 0.2299041748046875, 0.284576416015625, 0.3392486572265625, 0.3939208984375, 0.4485931396484375, 0.503265380859375, 0.5579376220703125, 0.61260986328125, 0.6672821044921875, 0.721954345703125, 0.7766265869140625, 0.831298828125, 0.8859710693359375, 0.940643310546875, 0.9953155517578125, 1.04998779296875, 1.1046600341796875, 1.159332275390625, 1.2140045166015625, 1.2686767578125, 1.3233489990234375, 1.378021240234375, 1.4326934814453125, 1.48736572265625, 1.5420379638671875, 1.596710205078125, 1.6513824462890625, 1.7060546875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 12.0, 18.0, 17.0, 27.0, 39.0, 54.0, 72.0, 122.0, 148.0, 206.0, 271.0, 391.0, 657.0, 884.0, 1338.0, 2159.0, 3278.0, 5561.0, 9451.0, 17836.0, 37088.0, 96505.0, 648237.0, 130004.0, 45347.0, 20863.0, 11011.0, 6139.0, 3675.0, 2415.0, 1486.0, 995.0, 654.0, 504.0, 322.0, 215.0, 157.0, 123.0, 85.0, 58.0, 37.0, 22.0, 23.0, 13.0, 12.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.88671875, -4.72711181640625, -4.5675048828125, -4.40789794921875, -4.248291015625, -4.08868408203125, -3.9290771484375, -3.76947021484375, -3.60986328125, -3.45025634765625, -3.2906494140625, -3.13104248046875, -2.971435546875, -2.81182861328125, -2.6522216796875, -2.49261474609375, -2.3330078125, -2.17340087890625, -2.0137939453125, -1.85418701171875, -1.694580078125, -1.53497314453125, -1.3753662109375, -1.21575927734375, -1.05615234375, -0.89654541015625, -0.7369384765625, -0.57733154296875, -0.417724609375, -0.25811767578125, -0.0985107421875, 0.06109619140625, 0.220703125, 0.38031005859375, 0.5399169921875, 0.69952392578125, 0.859130859375, 1.01873779296875, 1.1783447265625, 1.33795166015625, 1.49755859375, 1.65716552734375, 1.8167724609375, 1.97637939453125, 2.135986328125, 2.29559326171875, 2.4552001953125, 2.61480712890625, 2.7744140625, 2.93402099609375, 3.0936279296875, 3.25323486328125, 3.412841796875, 3.57244873046875, 3.7320556640625, 3.89166259765625, 4.05126953125, 4.21087646484375, 4.3704833984375, 4.53009033203125, 4.689697265625, 4.84930419921875, 5.0089111328125, 5.16851806640625, 5.328125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 10.0, 15.0, 26.0, 38.0, 56.0, 100.0, 397.0, 137.0, 66.0, 39.0, 27.0, 17.0, 17.0, 5.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034618377685546875, -0.0003352165222167969, -0.000324249267578125, -0.0003132820129394531, -0.00030231475830078125, -0.0002913475036621094, -0.0002803802490234375, -0.0002694129943847656, -0.00025844573974609375, -0.0002474784851074219, -0.00023651123046875, -0.00022554397583007812, -0.00021457672119140625, -0.00020360946655273438, -0.0001926422119140625, -0.00018167495727539062, -0.00017070770263671875, -0.00015974044799804688, -0.000148773193359375, -0.00013780593872070312, -0.00012683868408203125, -0.00011587142944335938, -0.0001049041748046875, -9.393692016601562e-05, -8.296966552734375e-05, -7.200241088867188e-05, -6.103515625e-05, -5.0067901611328125e-05, -3.910064697265625e-05, -2.8133392333984375e-05, -1.71661376953125e-05, -6.198883056640625e-06, 4.76837158203125e-06, 1.5735626220703125e-05, 2.6702880859375e-05, 3.7670135498046875e-05, 4.863739013671875e-05, 5.9604644775390625e-05, 7.05718994140625e-05, 8.153915405273438e-05, 9.250640869140625e-05, 0.00010347366333007812, 0.00011444091796875, 0.00012540817260742188, 0.00013637542724609375, 0.00014734268188476562, 0.0001583099365234375, 0.00016927719116210938, 0.00018024444580078125, 0.00019121170043945312, 0.000202178955078125, 0.00021314620971679688, 0.00022411346435546875, 0.00023508071899414062, 0.0002460479736328125, 0.0002570152282714844, 0.00026798248291015625, 0.0002789497375488281, 0.0002899169921875, 0.0003008842468261719, 0.00031185150146484375, 0.0003228187561035156, 0.0003337860107421875, 0.0003447532653808594, 0.00035572052001953125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 10.0, 6.0, 12.0, 14.0, 21.0, 30.0, 44.0, 74.0, 103.0, 141.0, 198.0, 288.0, 462.0, 707.0, 1140.0, 1588.0, 2689.0, 4835.0, 8823.0, 17531.0, 39573.0, 126471.0, 688538.0, 90180.0, 32020.0, 14555.0, 7597.0, 4094.0, 2436.0, 1445.0, 975.0, 637.0, 414.0, 285.0, 179.0, 135.0, 87.0, 59.0, 43.0, 39.0, 28.0, 18.0, 9.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.52734375, -5.36175537109375, -5.1961669921875, -5.03057861328125, -4.864990234375, -4.69940185546875, -4.5338134765625, -4.36822509765625, -4.20263671875, -4.03704833984375, -3.8714599609375, -3.70587158203125, -3.540283203125, -3.37469482421875, -3.2091064453125, -3.04351806640625, -2.8779296875, -2.71234130859375, -2.5467529296875, -2.38116455078125, -2.215576171875, -2.04998779296875, -1.8843994140625, -1.71881103515625, -1.55322265625, -1.38763427734375, -1.2220458984375, -1.05645751953125, -0.890869140625, -0.72528076171875, -0.5596923828125, -0.39410400390625, -0.228515625, -0.06292724609375, 0.1026611328125, 0.26824951171875, 0.433837890625, 0.59942626953125, 0.7650146484375, 0.93060302734375, 1.09619140625, 1.26177978515625, 1.4273681640625, 1.59295654296875, 1.758544921875, 1.92413330078125, 2.0897216796875, 2.25531005859375, 2.4208984375, 2.58648681640625, 2.7520751953125, 2.91766357421875, 3.083251953125, 3.24884033203125, 3.4144287109375, 3.58001708984375, 3.74560546875, 3.91119384765625, 4.0767822265625, 4.24237060546875, 4.407958984375, 4.57354736328125, 4.7391357421875, 4.90472412109375, 5.0703125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 6.0, 4.0, 2.0, 3.0, 9.0, 15.0, 13.0, 15.0, 14.0, 22.0, 19.0, 36.0, 34.0, 51.0, 104.0, 309.0, 81.0, 57.0, 51.0, 35.0, 23.0, 25.0, 21.0, 9.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.197479248046875, -1.15374755859375, -1.110015869140625, -1.0662841796875, -1.022552490234375, -0.97882080078125, -0.935089111328125, -0.891357421875, -0.847625732421875, -0.80389404296875, -0.760162353515625, -0.7164306640625, -0.672698974609375, -0.62896728515625, -0.585235595703125, -0.54150390625, -0.497772216796875, -0.45404052734375, -0.410308837890625, -0.3665771484375, -0.322845458984375, -0.27911376953125, -0.235382080078125, -0.191650390625, -0.147918701171875, -0.10418701171875, -0.060455322265625, -0.0167236328125, 0.027008056640625, 0.07073974609375, 0.114471435546875, 0.158203125, 0.201934814453125, 0.24566650390625, 0.289398193359375, 0.3331298828125, 0.376861572265625, 0.42059326171875, 0.464324951171875, 0.508056640625, 0.551788330078125, 0.59552001953125, 0.639251708984375, 0.6829833984375, 0.726715087890625, 0.77044677734375, 0.814178466796875, 0.85791015625, 0.901641845703125, 0.94537353515625, 0.989105224609375, 1.0328369140625, 1.076568603515625, 1.12030029296875, 1.164031982421875, 1.207763671875, 1.251495361328125, 1.29522705078125, 1.338958740234375, 1.3826904296875, 1.426422119140625, 1.47015380859375, 1.513885498046875, 1.5576171875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 12.0, 13.0, 24.0, 34.0, 42.0, 57.0, 96.0, 147.0, 150.0, 117.0, 79.0, 71.0, 50.0, 27.0, 30.0, 11.0, 15.0, 9.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0], "bins": [-9.411670684814453, -9.208216667175293, -9.004762649536133, -8.801308631896973, -8.597854614257812, -8.394400596618652, -8.190946578979492, -7.987492084503174, -7.784038066864014, -7.5805840492248535, -7.377130031585693, -7.173676013946533, -6.970221996307373, -6.766767501831055, -6.5633134841918945, -6.359859466552734, -6.156405448913574, -5.952951431274414, -5.749497413635254, -5.546043395996094, -5.342589378356934, -5.139135360717773, -4.935681343078613, -4.732226848602295, -4.528773307800293, -4.325319290161133, -4.121865272521973, -3.9184112548828125, -3.7149569988250732, -3.511502981185913, -3.308048963546753, -3.1045947074890137, -2.9011404514312744, -2.6976864337921143, -2.494232416152954, -2.290778160095215, -2.0873241424560547, -1.8838701248168945, -1.6804161071777344, -1.4769619703292847, -1.2735079526901245, -1.0700539350509644, -0.8665997982025146, -0.6631457805633545, -0.45969170331954956, -0.25623762607574463, -0.05278360843658447, 0.15067052841186523, 0.3541245460510254, 0.5575786232948303, 0.7610327005386353, 0.9644867181777954, 1.1679408550262451, 1.3713948726654053, 1.5748488903045654, 1.7783030271530151, 1.9817570447921753, 2.185211181640625, 2.388665199279785, 2.5921192169189453, 2.7955732345581055, 2.9990272521972656, 3.202481269836426, 3.405935525894165, 3.609389543533325]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 3.0, 4.0, 6.0, 12.0, 7.0, 6.0, 12.0, 15.0, 19.0, 26.0, 18.0, 29.0, 31.0, 22.0, 32.0, 26.0, 26.0, 39.0, 26.0, 27.0, 43.0, 38.0, 36.0, 37.0, 42.0, 35.0, 36.0, 39.0, 35.0, 31.0, 26.0, 25.0, 16.0, 24.0, 23.0, 18.0, 19.0, 14.0, 11.0, 11.0, 10.0, 7.0, 11.0, 5.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0], "bins": [-2.6638567447662354, -2.5786540508270264, -2.4934515953063965, -2.4082489013671875, -2.3230464458465576, -2.2378437519073486, -2.1526412963867188, -2.0674386024475098, -1.9822360277175903, -1.897033452987671, -1.8118308782577515, -1.726628303527832, -1.641425609588623, -1.5562231540679932, -1.4710204601287842, -1.3858178853988647, -1.3006153106689453, -1.2154127359390259, -1.1302101612091064, -1.0450074672698975, -0.9598049521446228, -0.8746023774147034, -0.7893997430801392, -0.7041971683502197, -0.6189945936203003, -0.5337920188903809, -0.44858941435813904, -0.3633868098258972, -0.2781842350959778, -0.19298166036605835, -0.10777902603149414, -0.022576451301574707, 0.06262612342834473, 0.14782871305942535, 0.23303130269050598, 0.3182339072227478, 0.40343648195266724, 0.48863905668258667, 0.5738416910171509, 0.6590442657470703, 0.7442468404769897, 0.8294494152069092, 0.9146519899368286, 0.9998546242713928, 1.085057258605957, 1.170259714126587, 1.255462408065796, 1.3406649827957153, 1.4258675575256348, 1.5110701322555542, 1.5962727069854736, 1.6814754009246826, 1.7666778564453125, 1.8518805503845215, 1.937083125114441, 2.0222856998443604, 2.1074881553649902, 2.192690849304199, 2.277893304824829, 2.363095998764038, 2.448298454284668, 2.533501148223877, 2.618703842163086, 2.703906297683716, 2.789108991622925]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 12.0, 20.0, 26.0, 47.0, 57.0, 60.0, 74.0, 135.0, 195.0, 295.0, 446.0, 658.0, 965.0, 1477.0, 2293.0, 3549.0, 5511.0, 8799.0, 14084.0, 23484.0, 40561.0, 75112.0, 150195.0, 371074.0, 1432388.0, 1381582.0, 361884.0, 146610.0, 73168.0, 39389.0, 22776.0, 13606.0, 8379.0, 5233.0, 3391.0, 2184.0, 1469.0, 1004.0, 633.0, 430.0, 310.0, 196.0, 156.0, 116.0, 73.0, 55.0, 38.0, 23.0, 21.0, 16.0, 9.0, 8.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.296875, -4.158203125, -4.01953125, -3.880859375, -3.7421875, -3.603515625, -3.46484375, -3.326171875, -3.1875, -3.048828125, -2.91015625, -2.771484375, -2.6328125, -2.494140625, -2.35546875, -2.216796875, -2.078125, -1.939453125, -1.80078125, -1.662109375, -1.5234375, -1.384765625, -1.24609375, -1.107421875, -0.96875, -0.830078125, -0.69140625, -0.552734375, -0.4140625, -0.275390625, -0.13671875, 0.001953125, 0.140625, 0.279296875, 0.41796875, 0.556640625, 0.6953125, 0.833984375, 0.97265625, 1.111328125, 1.25, 1.388671875, 1.52734375, 1.666015625, 1.8046875, 1.943359375, 2.08203125, 2.220703125, 2.359375, 2.498046875, 2.63671875, 2.775390625, 2.9140625, 3.052734375, 3.19140625, 3.330078125, 3.46875, 3.607421875, 3.74609375, 3.884765625, 4.0234375, 4.162109375, 4.30078125, 4.439453125, 4.578125]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 4.0, 6.0, 6.0, 7.0, 11.0, 7.0, 12.0, 15.0, 20.0, 22.0, 31.0, 33.0, 25.0, 38.0, 30.0, 31.0, 35.0, 41.0, 33.0, 27.0, 35.0, 38.0, 46.0, 54.0, 34.0, 31.0, 48.0, 39.0, 22.0, 32.0, 27.0, 21.0, 20.0, 13.0, 21.0, 9.0, 15.0, 12.0, 11.0, 8.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.845703125, -1.7869110107421875, -1.728118896484375, -1.6693267822265625, -1.61053466796875, -1.5517425537109375, -1.492950439453125, -1.4341583251953125, -1.3753662109375, -1.3165740966796875, -1.257781982421875, -1.1989898681640625, -1.14019775390625, -1.0814056396484375, -1.022613525390625, -0.9638214111328125, -0.905029296875, -0.8462371826171875, -0.787445068359375, -0.7286529541015625, -0.66986083984375, -0.6110687255859375, -0.552276611328125, -0.4934844970703125, -0.4346923828125, -0.3759002685546875, -0.317108154296875, -0.2583160400390625, -0.19952392578125, -0.1407318115234375, -0.081939697265625, -0.0231475830078125, 0.03564453125, 0.0944366455078125, 0.153228759765625, 0.2120208740234375, 0.27081298828125, 0.3296051025390625, 0.388397216796875, 0.4471893310546875, 0.5059814453125, 0.5647735595703125, 0.623565673828125, 0.6823577880859375, 0.74114990234375, 0.7999420166015625, 0.858734130859375, 0.9175262451171875, 0.976318359375, 1.0351104736328125, 1.093902587890625, 1.1526947021484375, 1.21148681640625, 1.2702789306640625, 1.329071044921875, 1.3878631591796875, 1.4466552734375, 1.5054473876953125, 1.564239501953125, 1.6230316162109375, 1.68182373046875, 1.7406158447265625, 1.799407958984375, 1.8582000732421875, 1.9169921875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 16.0, 11.0, 17.0, 29.0, 44.0, 68.0, 98.0, 175.0, 246.0, 364.0, 575.0, 879.0, 1319.0, 2081.0, 3347.0, 5685.0, 9106.0, 15484.0, 26951.0, 48287.0, 92557.0, 189984.0, 445238.0, 1362015.0, 1213181.0, 405367.0, 175910.0, 86265.0, 45843.0, 25510.0, 14597.0, 8842.0, 5300.0, 3156.0, 2033.0, 1259.0, 850.0, 551.0, 319.0, 236.0, 153.0, 109.0, 59.0, 46.0, 42.0, 29.0, 18.0, 6.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.7421875, -3.62506103515625, -3.5079345703125, -3.39080810546875, -3.273681640625, -3.15655517578125, -3.0394287109375, -2.92230224609375, -2.80517578125, -2.68804931640625, -2.5709228515625, -2.45379638671875, -2.336669921875, -2.21954345703125, -2.1024169921875, -1.98529052734375, -1.8681640625, -1.75103759765625, -1.6339111328125, -1.51678466796875, -1.399658203125, -1.28253173828125, -1.1654052734375, -1.04827880859375, -0.93115234375, -0.81402587890625, -0.6968994140625, -0.57977294921875, -0.462646484375, -0.34552001953125, -0.2283935546875, -0.11126708984375, 0.005859375, 0.12298583984375, 0.2401123046875, 0.35723876953125, 0.474365234375, 0.59149169921875, 0.7086181640625, 0.82574462890625, 0.94287109375, 1.05999755859375, 1.1771240234375, 1.29425048828125, 1.411376953125, 1.52850341796875, 1.6456298828125, 1.76275634765625, 1.8798828125, 1.99700927734375, 2.1141357421875, 2.23126220703125, 2.348388671875, 2.46551513671875, 2.5826416015625, 2.69976806640625, 2.81689453125, 2.93402099609375, 3.0511474609375, 3.16827392578125, 3.285400390625, 3.40252685546875, 3.5196533203125, 3.63677978515625, 3.75390625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 15.0, 18.0, 18.0, 38.0, 33.0, 50.0, 77.0, 86.0, 95.0, 126.0, 161.0, 182.0, 241.0, 274.0, 341.0, 346.0, 353.0, 289.0, 247.0, 209.0, 187.0, 147.0, 121.0, 83.0, 77.0, 63.0, 54.0, 33.0, 25.0, 18.0, 17.0, 10.0, 13.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2568359375, -1.21746826171875, -1.1781005859375, -1.13873291015625, -1.099365234375, -1.05999755859375, -1.0206298828125, -0.98126220703125, -0.94189453125, -0.90252685546875, -0.8631591796875, -0.82379150390625, -0.784423828125, -0.74505615234375, -0.7056884765625, -0.66632080078125, -0.626953125, -0.58758544921875, -0.5482177734375, -0.50885009765625, -0.469482421875, -0.43011474609375, -0.3907470703125, -0.35137939453125, -0.31201171875, -0.27264404296875, -0.2332763671875, -0.19390869140625, -0.154541015625, -0.11517333984375, -0.0758056640625, -0.03643798828125, 0.0029296875, 0.04229736328125, 0.0816650390625, 0.12103271484375, 0.160400390625, 0.19976806640625, 0.2391357421875, 0.27850341796875, 0.31787109375, 0.35723876953125, 0.3966064453125, 0.43597412109375, 0.475341796875, 0.51470947265625, 0.5540771484375, 0.59344482421875, 0.6328125, 0.67218017578125, 0.7115478515625, 0.75091552734375, 0.790283203125, 0.82965087890625, 0.8690185546875, 0.90838623046875, 0.94775390625, 0.98712158203125, 1.0264892578125, 1.06585693359375, 1.105224609375, 1.14459228515625, 1.1839599609375, 1.22332763671875, 1.2626953125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 10.0, 8.0, 16.0, 14.0, 28.0, 24.0, 48.0, 85.0, 79.0, 102.0, 136.0, 107.0, 86.0, 71.0, 46.0, 49.0, 24.0, 11.0, 8.0, 15.0, 4.0, 4.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9193053245544434, -3.799006223678589, -3.6787068843841553, -3.558407783508301, -3.4381086826324463, -3.317809581756592, -3.197510242462158, -3.0772111415863037, -2.956912040710449, -2.8366129398345947, -2.716313600540161, -2.5960144996643066, -2.475715398788452, -2.3554162979125977, -2.235116958618164, -2.1148178577423096, -1.994518518447876, -1.874219298362732, -1.7539201974868774, -1.6336209774017334, -1.513321876525879, -1.3930226564407349, -1.2727234363555908, -1.1524243354797363, -1.0321251153945923, -0.911825954914093, -0.7915267944335938, -0.6712275743484497, -0.5509284138679504, -0.43062925338745117, -0.31033003330230713, -0.19003087282180786, -0.0697319507598877, 0.050567224621772766, 0.17086640000343323, 0.2911655902862549, 0.41146475076675415, 0.5317639112472534, 0.6520631313323975, 0.7723622918128967, 0.892661452293396, 1.01296067237854, 1.1332597732543945, 1.2535589933395386, 1.3738582134246826, 1.494157314300537, 1.6144565343856812, 1.7347557544708252, 1.8550548553466797, 1.9753540754318237, 2.0956532955169678, 2.2159523963928223, 2.3362514972686768, 2.4565505981445312, 2.576849937438965, 2.6971490383148193, 2.817448139190674, 2.9377472400665283, 3.058046579360962, 3.1783456802368164, 3.298644781112671, 3.4189438819885254, 3.539243221282959, 3.6595423221588135, 3.779841661453247]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 5.0, 8.0, 9.0, 10.0, 13.0, 21.0, 23.0, 27.0, 17.0, 23.0, 27.0, 20.0, 25.0, 31.0, 33.0, 32.0, 49.0, 36.0, 42.0, 39.0, 44.0, 43.0, 49.0, 26.0, 35.0, 32.0, 33.0, 24.0, 21.0, 26.0, 17.0, 22.0, 18.0, 15.0, 16.0, 14.0, 20.0, 7.0, 6.0, 8.0, 11.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0], "bins": [-2.208970785140991, -2.144301176071167, -2.079631805419922, -2.0149621963500977, -1.950292706489563, -1.8856232166290283, -1.820953607559204, -1.7562841176986694, -1.6916146278381348, -1.6269451379776, -1.5622756481170654, -1.4976060390472412, -1.4329365491867065, -1.3682670593261719, -1.3035974502563477, -1.238927960395813, -1.1742584705352783, -1.1095889806747437, -1.044919490814209, -0.9802498817443848, -0.9155803918838501, -0.8509109020233154, -0.786241352558136, -0.7215718030929565, -0.6569023132324219, -0.5922328233718872, -0.5275632739067078, -0.4628937542438507, -0.39822423458099365, -0.3335547149181366, -0.26888519525527954, -0.20421567559242249, -0.13954615592956543, -0.07487663626670837, -0.010207116603851318, 0.05446240305900574, 0.11913192272186279, 0.18380144238471985, 0.2484709620475769, 0.31314048171043396, 0.377810001373291, 0.44247952103614807, 0.5071490406990051, 0.5718185901641846, 0.6364880800247192, 0.7011575698852539, 0.7658271193504333, 0.8304966688156128, 0.8951661586761475, 0.9598356485366821, 1.0245051383972168, 1.089174747467041, 1.1538442373275757, 1.2185137271881104, 1.2831833362579346, 1.3478528261184692, 1.412522315979004, 1.4771918058395386, 1.5418612957000732, 1.6065309047698975, 1.6712003946304321, 1.7358698844909668, 1.800539493560791, 1.8652089834213257, 1.9298784732818604]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 5.0, 12.0, 17.0, 22.0, 18.0, 49.0, 57.0, 79.0, 111.0, 165.0, 222.0, 321.0, 474.0, 702.0, 940.0, 1442.0, 2168.0, 3248.0, 5130.0, 7802.0, 12452.0, 20637.0, 34512.0, 60285.0, 113831.0, 243482.0, 261533.0, 120462.0, 64009.0, 36164.0, 21447.0, 12899.0, 8213.0, 5238.0, 3345.0, 2211.0, 1528.0, 1033.0, 715.0, 497.0, 314.0, 211.0, 178.0, 122.0, 86.0, 48.0, 32.0, 31.0, 15.0, 11.0, 10.0, 7.0, 12.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.68603515625, -0.6632003784179688, -0.6403656005859375, -0.6175308227539062, -0.594696044921875, -0.5718612670898438, -0.5490264892578125, -0.5261917114257812, -0.50335693359375, -0.48052215576171875, -0.4576873779296875, -0.43485260009765625, -0.412017822265625, -0.38918304443359375, -0.3663482666015625, -0.34351348876953125, -0.3206787109375, -0.29784393310546875, -0.2750091552734375, -0.25217437744140625, -0.229339599609375, -0.20650482177734375, -0.1836700439453125, -0.16083526611328125, -0.13800048828125, -0.11516571044921875, -0.0923309326171875, -0.06949615478515625, -0.046661376953125, -0.02382659912109375, -0.0009918212890625, 0.02184295654296875, 0.044677734375, 0.06751251220703125, 0.0903472900390625, 0.11318206787109375, 0.136016845703125, 0.15885162353515625, 0.1816864013671875, 0.20452117919921875, 0.22735595703125, 0.25019073486328125, 0.2730255126953125, 0.29586029052734375, 0.318695068359375, 0.34152984619140625, 0.3643646240234375, 0.38719940185546875, 0.4100341796875, 0.43286895751953125, 0.4557037353515625, 0.47853851318359375, 0.501373291015625, 0.5242080688476562, 0.5470428466796875, 0.5698776245117188, 0.59271240234375, 0.6155471801757812, 0.6383819580078125, 0.6612167358398438, 0.684051513671875, 0.7068862915039062, 0.7297210693359375, 0.7525558471679688, 0.775390625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 6.0, 5.0, 5.0, 6.0, 11.0, 21.0, 18.0, 15.0, 19.0, 27.0, 24.0, 13.0, 24.0, 33.0, 33.0, 34.0, 33.0, 32.0, 38.0, 42.0, 46.0, 45.0, 39.0, 48.0, 29.0, 46.0, 32.0, 32.0, 17.0, 26.0, 31.0, 29.0, 17.0, 16.0, 12.0, 13.0, 16.0, 12.0, 15.0, 8.0, 5.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.21484375, -2.14825439453125, -2.0816650390625, -2.01507568359375, -1.948486328125, -1.88189697265625, -1.8153076171875, -1.74871826171875, -1.68212890625, -1.61553955078125, -1.5489501953125, -1.48236083984375, -1.415771484375, -1.34918212890625, -1.2825927734375, -1.21600341796875, -1.1494140625, -1.08282470703125, -1.0162353515625, -0.94964599609375, -0.883056640625, -0.81646728515625, -0.7498779296875, -0.68328857421875, -0.61669921875, -0.55010986328125, -0.4835205078125, -0.41693115234375, -0.350341796875, -0.28375244140625, -0.2171630859375, -0.15057373046875, -0.083984375, -0.01739501953125, 0.0491943359375, 0.11578369140625, 0.182373046875, 0.24896240234375, 0.3155517578125, 0.38214111328125, 0.44873046875, 0.51531982421875, 0.5819091796875, 0.64849853515625, 0.715087890625, 0.78167724609375, 0.8482666015625, 0.91485595703125, 0.9814453125, 1.04803466796875, 1.1146240234375, 1.18121337890625, 1.247802734375, 1.31439208984375, 1.3809814453125, 1.44757080078125, 1.51416015625, 1.58074951171875, 1.6473388671875, 1.71392822265625, 1.780517578125, 1.84710693359375, 1.9136962890625, 1.98028564453125, 2.046875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 10.0, 19.0, 24.0, 26.0, 31.0, 43.0, 63.0, 100.0, 124.0, 190.0, 252.0, 399.0, 564.0, 909.0, 1362.0, 2216.0, 3551.0, 6148.0, 11072.0, 20968.0, 43916.0, 110464.0, 415644.0, 273133.0, 81758.0, 34891.0, 17409.0, 9310.0, 5214.0, 3098.0, 1938.0, 1209.0, 820.0, 525.0, 359.0, 261.0, 143.0, 112.0, 81.0, 65.0, 49.0, 20.0, 15.0, 17.0, 6.0, 6.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 5.0], "bins": [-1.265625, -1.228240966796875, -1.19085693359375, -1.153472900390625, -1.1160888671875, -1.078704833984375, -1.04132080078125, -1.003936767578125, -0.966552734375, -0.929168701171875, -0.89178466796875, -0.854400634765625, -0.8170166015625, -0.779632568359375, -0.74224853515625, -0.704864501953125, -0.66748046875, -0.630096435546875, -0.59271240234375, -0.555328369140625, -0.5179443359375, -0.480560302734375, -0.44317626953125, -0.405792236328125, -0.368408203125, -0.331024169921875, -0.29364013671875, -0.256256103515625, -0.2188720703125, -0.181488037109375, -0.14410400390625, -0.106719970703125, -0.0693359375, -0.031951904296875, 0.00543212890625, 0.042816162109375, 0.0802001953125, 0.117584228515625, 0.15496826171875, 0.192352294921875, 0.229736328125, 0.267120361328125, 0.30450439453125, 0.341888427734375, 0.3792724609375, 0.416656494140625, 0.45404052734375, 0.491424560546875, 0.52880859375, 0.566192626953125, 0.60357666015625, 0.640960693359375, 0.6783447265625, 0.715728759765625, 0.75311279296875, 0.790496826171875, 0.827880859375, 0.865264892578125, 0.90264892578125, 0.940032958984375, 0.9774169921875, 1.014801025390625, 1.05218505859375, 1.089569091796875, 1.126953125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 6.0, 8.0, 11.0, 10.0, 21.0, 10.0, 11.0, 17.0, 27.0, 22.0, 21.0, 27.0, 34.0, 27.0, 28.0, 42.0, 46.0, 34.0, 46.0, 37.0, 39.0, 39.0, 38.0, 36.0, 47.0, 30.0, 38.0, 40.0, 25.0, 27.0, 23.0, 17.0, 19.0, 15.0, 14.0, 15.0, 13.0, 9.0, 9.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.3759765625, -1.331573486328125, -1.28717041015625, -1.242767333984375, -1.1983642578125, -1.153961181640625, -1.10955810546875, -1.065155029296875, -1.020751953125, -0.976348876953125, -0.93194580078125, -0.887542724609375, -0.8431396484375, -0.798736572265625, -0.75433349609375, -0.709930419921875, -0.66552734375, -0.621124267578125, -0.57672119140625, -0.532318115234375, -0.4879150390625, -0.443511962890625, -0.39910888671875, -0.354705810546875, -0.310302734375, -0.265899658203125, -0.22149658203125, -0.177093505859375, -0.1326904296875, -0.088287353515625, -0.04388427734375, 0.000518798828125, 0.044921875, 0.089324951171875, 0.13372802734375, 0.178131103515625, 0.2225341796875, 0.266937255859375, 0.31134033203125, 0.355743408203125, 0.400146484375, 0.444549560546875, 0.48895263671875, 0.533355712890625, 0.5777587890625, 0.622161865234375, 0.66656494140625, 0.710968017578125, 0.75537109375, 0.799774169921875, 0.84417724609375, 0.888580322265625, 0.9329833984375, 0.977386474609375, 1.02178955078125, 1.066192626953125, 1.110595703125, 1.154998779296875, 1.19940185546875, 1.243804931640625, 1.2882080078125, 1.332611083984375, 1.37701416015625, 1.421417236328125, 1.4658203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 8.0, 16.0, 19.0, 33.0, 41.0, 72.0, 91.0, 119.0, 154.0, 226.0, 350.0, 511.0, 715.0, 1032.0, 1560.0, 2529.0, 3821.0, 6013.0, 10301.0, 18095.0, 33848.0, 71623.0, 214423.0, 472581.0, 106897.0, 45774.0, 23368.0, 13184.0, 7647.0, 4709.0, 2931.0, 1976.0, 1205.0, 839.0, 553.0, 352.0, 269.0, 175.0, 137.0, 95.0, 74.0, 45.0, 19.0, 31.0, 19.0, 21.0, 14.0, 10.0, 6.0, 4.0, 2.0, 2.0, 6.0, 4.0, 1.0, 2.0], "bins": [-0.093505859375, -0.09051036834716797, -0.08751487731933594, -0.0845193862915039, -0.08152389526367188, -0.07852840423583984, -0.07553291320800781, -0.07253742218017578, -0.06954193115234375, -0.06654644012451172, -0.06355094909667969, -0.060555458068847656, -0.057559967041015625, -0.054564476013183594, -0.05156898498535156, -0.04857349395751953, -0.0455780029296875, -0.04258251190185547, -0.03958702087402344, -0.036591529846191406, -0.033596038818359375, -0.030600547790527344, -0.027605056762695312, -0.02460956573486328, -0.02161407470703125, -0.01861858367919922, -0.015623092651367188, -0.012627601623535156, -0.009632110595703125, -0.006636619567871094, -0.0036411285400390625, -0.0006456375122070312, 0.002349853515625, 0.005345344543457031, 0.008340835571289062, 0.011336326599121094, 0.014331817626953125, 0.017327308654785156, 0.020322799682617188, 0.02331829071044922, 0.02631378173828125, 0.02930927276611328, 0.03230476379394531, 0.035300254821777344, 0.038295745849609375, 0.041291236877441406, 0.04428672790527344, 0.04728221893310547, 0.0502777099609375, 0.05327320098876953, 0.05626869201660156, 0.059264183044433594, 0.062259674072265625, 0.06525516510009766, 0.06825065612792969, 0.07124614715576172, 0.07424163818359375, 0.07723712921142578, 0.08023262023925781, 0.08322811126708984, 0.08622360229492188, 0.0892190933227539, 0.09221458435058594, 0.09521007537841797, 0.09820556640625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 7.0, 8.0, 11.0, 13.0, 32.0, 15.0, 26.0, 39.0, 49.0, 50.0, 90.0, 96.0, 106.0, 94.0, 76.0, 68.0, 54.0, 35.0, 27.0, 17.0, 16.0, 13.0, 12.0, 7.0, 7.0, 7.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0609626770019531e-05, -1.0300427675247192e-05, -9.991228580474854e-06, -9.682029485702515e-06, -9.372830390930176e-06, -9.063631296157837e-06, -8.754432201385498e-06, -8.44523310661316e-06, -8.13603401184082e-06, -7.826834917068481e-06, -7.517635822296143e-06, -7.208436727523804e-06, -6.899237632751465e-06, -6.590038537979126e-06, -6.280839443206787e-06, -5.971640348434448e-06, -5.662441253662109e-06, -5.3532421588897705e-06, -5.044043064117432e-06, -4.734843969345093e-06, -4.425644874572754e-06, -4.116445779800415e-06, -3.807246685028076e-06, -3.4980475902557373e-06, -3.1888484954833984e-06, -2.8796494007110596e-06, -2.5704503059387207e-06, -2.261251211166382e-06, -1.952052116394043e-06, -1.642853021621704e-06, -1.3336539268493652e-06, -1.0244548320770264e-06, -7.152557373046875e-07, -4.0605664253234863e-07, -9.685754776000977e-08, 2.123415470123291e-07, 5.21540641784668e-07, 8.307397365570068e-07, 1.1399388313293457e-06, 1.4491379261016846e-06, 1.7583370208740234e-06, 2.0675361156463623e-06, 2.376735210418701e-06, 2.68593430519104e-06, 2.995133399963379e-06, 3.3043324947357178e-06, 3.6135315895080566e-06, 3.9227306842803955e-06, 4.231929779052734e-06, 4.541128873825073e-06, 4.850327968597412e-06, 5.159527063369751e-06, 5.46872615814209e-06, 5.777925252914429e-06, 6.087124347686768e-06, 6.3963234424591064e-06, 6.705522537231445e-06, 7.014721632003784e-06, 7.323920726776123e-06, 7.633119821548462e-06, 7.9423189163208e-06, 8.25151801109314e-06, 8.560717105865479e-06, 8.869916200637817e-06, 9.179115295410156e-06]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 10.0, 10.0, 11.0, 13.0, 29.0, 35.0, 43.0, 63.0, 105.0, 107.0, 181.0, 211.0, 316.0, 454.0, 576.0, 846.0, 1278.0, 1733.0, 2552.0, 3742.0, 5694.0, 8990.0, 13989.0, 23207.0, 40640.0, 79345.0, 196243.0, 397777.0, 126635.0, 58866.0, 32034.0, 18836.0, 11363.0, 7269.0, 4724.0, 3225.0, 2152.0, 1545.0, 1049.0, 746.0, 527.0, 411.0, 241.0, 210.0, 146.0, 109.0, 81.0, 49.0, 46.0, 33.0, 26.0, 12.0, 9.0, 5.0, 9.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.109375, -0.105987548828125, -0.10260009765625, -0.099212646484375, -0.0958251953125, -0.092437744140625, -0.08905029296875, -0.085662841796875, -0.082275390625, -0.078887939453125, -0.07550048828125, -0.072113037109375, -0.0687255859375, -0.065338134765625, -0.06195068359375, -0.058563232421875, -0.05517578125, -0.051788330078125, -0.04840087890625, -0.045013427734375, -0.0416259765625, -0.038238525390625, -0.03485107421875, -0.031463623046875, -0.028076171875, -0.024688720703125, -0.02130126953125, -0.017913818359375, -0.0145263671875, -0.011138916015625, -0.00775146484375, -0.004364013671875, -0.0009765625, 0.002410888671875, 0.00579833984375, 0.009185791015625, 0.0125732421875, 0.015960693359375, 0.01934814453125, 0.022735595703125, 0.026123046875, 0.029510498046875, 0.03289794921875, 0.036285400390625, 0.0396728515625, 0.043060302734375, 0.04644775390625, 0.049835205078125, 0.05322265625, 0.056610107421875, 0.05999755859375, 0.063385009765625, 0.0667724609375, 0.070159912109375, 0.07354736328125, 0.076934814453125, 0.080322265625, 0.083709716796875, 0.08709716796875, 0.090484619140625, 0.0938720703125, 0.097259521484375, 0.10064697265625, 0.104034423828125, 0.107421875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 9.0, 6.0, 5.0, 9.0, 8.0, 5.0, 9.0, 6.0, 10.0, 18.0, 17.0, 17.0, 26.0, 33.0, 27.0, 30.0, 44.0, 68.0, 98.0, 111.0, 70.0, 69.0, 56.0, 45.0, 29.0, 29.0, 18.0, 22.0, 20.0, 14.0, 10.0, 6.0, 14.0, 9.0, 3.0, 4.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036590576171875, -0.03549385070800781, -0.034397125244140625, -0.03330039978027344, -0.03220367431640625, -0.031106948852539062, -0.030010223388671875, -0.028913497924804688, -0.0278167724609375, -0.026720046997070312, -0.025623321533203125, -0.024526596069335938, -0.02342987060546875, -0.022333145141601562, -0.021236419677734375, -0.020139694213867188, -0.01904296875, -0.017946243286132812, -0.016849517822265625, -0.015752792358398438, -0.01465606689453125, -0.013559341430664062, -0.012462615966796875, -0.011365890502929688, -0.0102691650390625, -0.009172439575195312, -0.008075714111328125, -0.0069789886474609375, -0.00588226318359375, -0.0047855377197265625, -0.003688812255859375, -0.0025920867919921875, -0.001495361328125, -0.0003986358642578125, 0.000698089599609375, 0.0017948150634765625, 0.00289154052734375, 0.0039882659912109375, 0.005084991455078125, 0.0061817169189453125, 0.0072784423828125, 0.008375167846679688, 0.009471893310546875, 0.010568618774414062, 0.01166534423828125, 0.012762069702148438, 0.013858795166015625, 0.014955520629882812, 0.01605224609375, 0.017148971557617188, 0.018245697021484375, 0.019342422485351562, 0.02043914794921875, 0.021535873413085938, 0.022632598876953125, 0.023729324340820312, 0.0248260498046875, 0.025922775268554688, 0.027019500732421875, 0.028116226196289062, 0.02921295166015625, 0.030309677124023438, 0.031406402587890625, 0.03250312805175781, 0.033599853515625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 10.0, 13.0, 18.0, 23.0, 33.0, 41.0, 78.0, 84.0, 104.0, 128.0, 101.0, 96.0, 76.0, 47.0, 43.0, 30.0, 11.0, 11.0, 12.0, 5.0, 6.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.896960496902466, -3.7775113582611084, -3.658062219619751, -3.5386130809783936, -3.419163942337036, -3.2997148036956787, -3.180265426635742, -3.0608162879943848, -2.9413671493530273, -2.82191801071167, -2.7024688720703125, -2.583019733428955, -2.4635705947875977, -2.3441214561462402, -2.224672317504883, -2.1052231788635254, -1.985774040222168, -1.8663249015808105, -1.7468757629394531, -1.6274266242980957, -1.5079774856567383, -1.3885283470153809, -1.2690790891647339, -1.1496299505233765, -1.030180811882019, -0.9107316732406616, -0.7912825345993042, -0.671833336353302, -0.5523841977119446, -0.43293505907058716, -0.31348586082458496, -0.19403672218322754, -0.07458782196044922, 0.0448613315820694, 0.164310485124588, 0.2837596535682678, 0.40320879220962524, 0.5226579308509827, 0.6421071290969849, 0.7615562677383423, 0.8810054063796997, 1.0004545450210571, 1.1199036836624146, 1.2393529415130615, 1.358802080154419, 1.4782512187957764, 1.5977003574371338, 1.7171494960784912, 1.8365986347198486, 1.956047773361206, 2.0754969120025635, 2.194946050643921, 2.3143951892852783, 2.4338443279266357, 2.5532937049865723, 2.6727428436279297, 2.792191982269287, 2.9116411209106445, 3.031090259552002, 3.1505393981933594, 3.269988536834717, 3.389437675476074, 3.5088868141174316, 3.628335952758789, 3.7477850914001465]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 8.0, 4.0, 9.0, 9.0, 11.0, 14.0, 26.0, 18.0, 26.0, 23.0, 19.0, 26.0, 22.0, 21.0, 31.0, 33.0, 34.0, 47.0, 39.0, 50.0, 30.0, 43.0, 45.0, 45.0, 26.0, 35.0, 33.0, 33.0, 24.0, 20.0, 28.0, 16.0, 22.0, 19.0, 13.0, 17.0, 13.0, 20.0, 7.0, 8.0, 6.0, 11.0, 4.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0], "bins": [-2.1782519817352295, -2.113868236541748, -2.0494847297668457, -1.9851009845733643, -1.9207173585891724, -1.8563337326049805, -1.791949987411499, -1.7275663614273071, -1.6631827354431152, -1.5987991094589233, -1.534415364265442, -1.47003173828125, -1.405648112297058, -1.3412644863128662, -1.2768807411193848, -1.2124971151351929, -1.1481133699417114, -1.0837297439575195, -1.019345998764038, -0.9549623727798462, -0.8905787467956543, -0.8261950612068176, -0.761811375617981, -0.6974277496337891, -0.6330440640449524, -0.5686603784561157, -0.5042767524719238, -0.43989306688308716, -0.3755094110965729, -0.3111257553100586, -0.24674206972122192, -0.18235841393470764, -0.11797463893890381, -0.05359097570180893, 0.01079268753528595, 0.07517635822296143, 0.1395600140094757, 0.20394366979599, 0.26832735538482666, 0.33271101117134094, 0.3970946669578552, 0.4614783227443695, 0.5258619785308838, 0.5902456641197205, 0.6546293497085571, 0.719012975692749, 0.7833966612815857, 0.8477803468704224, 0.9121639728546143, 0.9765476584434509, 1.0409313440322876, 1.1053149700164795, 1.1696985960006714, 1.2340822219848633, 1.2984659671783447, 1.3628495931625366, 1.4272332191467285, 1.4916168451309204, 1.5560005903244019, 1.6203842163085938, 1.6847678422927856, 1.7491514682769775, 1.813535213470459, 1.8779188394546509, 1.9423025846481323]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 14.0, 10.0, 27.0, 43.0, 55.0, 87.0, 129.0, 179.0, 272.0, 443.0, 691.0, 1087.0, 1721.0, 2931.0, 5055.0, 8753.0, 15663.0, 28579.0, 55297.0, 110730.0, 249546.0, 293715.0, 133045.0, 64378.0, 33660.0, 17967.0, 9871.0, 5748.0, 3437.0, 1977.0, 1245.0, 771.0, 521.0, 316.0, 184.0, 137.0, 81.0, 63.0, 43.0, 27.0, 20.0, 10.0, 11.0, 9.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.07562255859375, -3.9403076171875, -3.80499267578125, -3.669677734375, -3.53436279296875, -3.3990478515625, -3.26373291015625, -3.12841796875, -2.99310302734375, -2.8577880859375, -2.72247314453125, -2.587158203125, -2.45184326171875, -2.3165283203125, -2.18121337890625, -2.0458984375, -1.91058349609375, -1.7752685546875, -1.63995361328125, -1.504638671875, -1.36932373046875, -1.2340087890625, -1.09869384765625, -0.96337890625, -0.82806396484375, -0.6927490234375, -0.55743408203125, -0.422119140625, -0.28680419921875, -0.1514892578125, -0.01617431640625, 0.119140625, 0.25445556640625, 0.3897705078125, 0.52508544921875, 0.660400390625, 0.79571533203125, 0.9310302734375, 1.06634521484375, 1.20166015625, 1.33697509765625, 1.4722900390625, 1.60760498046875, 1.742919921875, 1.87823486328125, 2.0135498046875, 2.14886474609375, 2.2841796875, 2.41949462890625, 2.5548095703125, 2.69012451171875, 2.825439453125, 2.96075439453125, 3.0960693359375, 3.23138427734375, 3.36669921875, 3.50201416015625, 3.6373291015625, 3.77264404296875, 3.907958984375, 4.04327392578125, 4.1785888671875, 4.31390380859375, 4.44921875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 3.0, 6.0, 8.0, 7.0, 14.0, 20.0, 14.0, 18.0, 25.0, 18.0, 20.0, 30.0, 26.0, 23.0, 31.0, 25.0, 44.0, 38.0, 41.0, 37.0, 40.0, 42.0, 44.0, 54.0, 44.0, 29.0, 27.0, 38.0, 32.0, 21.0, 19.0, 23.0, 26.0, 17.0, 12.0, 18.0, 6.0, 11.0, 14.0, 9.0, 6.0, 8.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.041015625, -1.9806060791015625, -1.920196533203125, -1.8597869873046875, -1.79937744140625, -1.7389678955078125, -1.678558349609375, -1.6181488037109375, -1.5577392578125, -1.4973297119140625, -1.436920166015625, -1.3765106201171875, -1.31610107421875, -1.2556915283203125, -1.195281982421875, -1.1348724365234375, -1.074462890625, -1.0140533447265625, -0.953643798828125, -0.8932342529296875, -0.83282470703125, -0.7724151611328125, -0.712005615234375, -0.6515960693359375, -0.5911865234375, -0.5307769775390625, -0.470367431640625, -0.4099578857421875, -0.34954833984375, -0.2891387939453125, -0.228729248046875, -0.1683197021484375, -0.10791015625, -0.0475006103515625, 0.012908935546875, 0.0733184814453125, 0.13372802734375, 0.1941375732421875, 0.254547119140625, 0.3149566650390625, 0.3753662109375, 0.4357757568359375, 0.496185302734375, 0.5565948486328125, 0.61700439453125, 0.6774139404296875, 0.737823486328125, 0.7982330322265625, 0.858642578125, 0.9190521240234375, 0.979461669921875, 1.0398712158203125, 1.10028076171875, 1.1606903076171875, 1.221099853515625, 1.2815093994140625, 1.3419189453125, 1.4023284912109375, 1.462738037109375, 1.5231475830078125, 1.58355712890625, 1.6439666748046875, 1.704376220703125, 1.7647857666015625, 1.8251953125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 0.0, 6.0, 13.0, 17.0, 26.0, 27.0, 42.0, 76.0, 108.0, 174.0, 262.0, 404.0, 630.0, 1136.0, 1742.0, 3026.0, 5033.0, 8914.0, 15755.0, 28420.0, 53144.0, 100906.0, 207106.0, 296834.0, 153127.0, 77737.0, 41471.0, 22338.0, 12618.0, 7073.0, 4086.0, 2433.0, 1435.0, 931.0, 525.0, 323.0, 255.0, 115.0, 102.0, 56.0, 53.0, 20.0, 16.0, 16.0, 10.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.708984375, -3.586578369140625, -3.46417236328125, -3.341766357421875, -3.2193603515625, -3.096954345703125, -2.97454833984375, -2.852142333984375, -2.729736328125, -2.607330322265625, -2.48492431640625, -2.362518310546875, -2.2401123046875, -2.117706298828125, -1.99530029296875, -1.872894287109375, -1.75048828125, -1.628082275390625, -1.50567626953125, -1.383270263671875, -1.2608642578125, -1.138458251953125, -1.01605224609375, -0.893646240234375, -0.771240234375, -0.648834228515625, -0.52642822265625, -0.404022216796875, -0.2816162109375, -0.159210205078125, -0.03680419921875, 0.085601806640625, 0.2080078125, 0.330413818359375, 0.45281982421875, 0.575225830078125, 0.6976318359375, 0.820037841796875, 0.94244384765625, 1.064849853515625, 1.187255859375, 1.309661865234375, 1.43206787109375, 1.554473876953125, 1.6768798828125, 1.799285888671875, 1.92169189453125, 2.044097900390625, 2.16650390625, 2.288909912109375, 2.41131591796875, 2.533721923828125, 2.6561279296875, 2.778533935546875, 2.90093994140625, 3.023345947265625, 3.145751953125, 3.268157958984375, 3.39056396484375, 3.512969970703125, 3.6353759765625, 3.757781982421875, 3.88018798828125, 4.002593994140625, 4.125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 7.0, 4.0, 10.0, 8.0, 16.0, 20.0, 10.0, 19.0, 21.0, 19.0, 33.0, 30.0, 34.0, 36.0, 31.0, 39.0, 36.0, 44.0, 50.0, 38.0, 30.0, 37.0, 37.0, 29.0, 33.0, 38.0, 37.0, 34.0, 30.0, 23.0, 27.0, 15.0, 21.0, 14.0, 8.0, 18.0, 9.0, 11.0, 14.0, 7.0, 3.0, 4.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.333984375, -1.2951202392578125, -1.256256103515625, -1.2173919677734375, -1.17852783203125, -1.1396636962890625, -1.100799560546875, -1.0619354248046875, -1.0230712890625, -0.9842071533203125, -0.945343017578125, -0.9064788818359375, -0.86761474609375, -0.8287506103515625, -0.789886474609375, -0.7510223388671875, -0.712158203125, -0.6732940673828125, -0.634429931640625, -0.5955657958984375, -0.55670166015625, -0.5178375244140625, -0.478973388671875, -0.4401092529296875, -0.4012451171875, -0.3623809814453125, -0.323516845703125, -0.2846527099609375, -0.24578857421875, -0.2069244384765625, -0.168060302734375, -0.1291961669921875, -0.09033203125, -0.0514678955078125, -0.012603759765625, 0.0262603759765625, 0.06512451171875, 0.1039886474609375, 0.142852783203125, 0.1817169189453125, 0.2205810546875, 0.2594451904296875, 0.298309326171875, 0.3371734619140625, 0.37603759765625, 0.4149017333984375, 0.453765869140625, 0.4926300048828125, 0.531494140625, 0.5703582763671875, 0.609222412109375, 0.6480865478515625, 0.68695068359375, 0.7258148193359375, 0.764678955078125, 0.8035430908203125, 0.8424072265625, 0.8812713623046875, 0.920135498046875, 0.9589996337890625, 0.99786376953125, 1.0367279052734375, 1.075592041015625, 1.1144561767578125, 1.1533203125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 11.0, 9.0, 12.0, 32.0, 38.0, 41.0, 74.0, 88.0, 128.0, 191.0, 314.0, 466.0, 724.0, 1109.0, 1765.0, 3014.0, 5304.0, 9236.0, 17704.0, 37673.0, 99677.0, 642830.0, 136116.0, 45411.0, 20928.0, 10633.0, 5985.0, 3317.0, 2070.0, 1285.0, 805.0, 505.0, 347.0, 216.0, 160.0, 96.0, 74.0, 42.0, 41.0, 26.0, 14.0, 13.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.630859375, -3.51953125, -3.408203125, -3.296875, -3.185546875, -3.07421875, -2.962890625, -2.8515625, -2.740234375, -2.62890625, -2.517578125, -2.40625, -2.294921875, -2.18359375, -2.072265625, -1.9609375, -1.849609375, -1.73828125, -1.626953125, -1.515625, -1.404296875, -1.29296875, -1.181640625, -1.0703125, -0.958984375, -0.84765625, -0.736328125, -0.625, -0.513671875, -0.40234375, -0.291015625, -0.1796875, -0.068359375, 0.04296875, 0.154296875, 0.265625, 0.376953125, 0.48828125, 0.599609375, 0.7109375, 0.822265625, 0.93359375, 1.044921875, 1.15625, 1.267578125, 1.37890625, 1.490234375, 1.6015625, 1.712890625, 1.82421875, 1.935546875, 2.046875, 2.158203125, 2.26953125, 2.380859375, 2.4921875, 2.603515625, 2.71484375, 2.826171875, 2.9375, 3.048828125, 3.16015625, 3.271484375, 3.3828125, 3.494140625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 14.0, 12.0, 23.0, 21.0, 34.0, 54.0, 100.0, 268.0, 181.0, 99.0, 47.0, 29.0, 29.0, 10.0, 13.0, 12.0, 5.0, 9.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00012063980102539062, -0.00011559948325157166, -0.00011055916547775269, -0.00010551884770393372, -0.00010047852993011475, -9.543821215629578e-05, -9.03978943824768e-05, -8.535757660865784e-05, -8.031725883483887e-05, -7.52769410610199e-05, -7.023662328720093e-05, -6.519630551338196e-05, -6.015598773956299e-05, -5.511566996574402e-05, -5.007535219192505e-05, -4.503503441810608e-05, -3.999471664428711e-05, -3.495439887046814e-05, -2.991408109664917e-05, -2.48737633228302e-05, -1.983344554901123e-05, -1.479312777519226e-05, -9.752810001373291e-06, -4.712492227554321e-06, 3.2782554626464844e-07, 5.368143320083618e-06, 1.0408461093902588e-05, 1.5448778867721558e-05, 2.0489096641540527e-05, 2.5529414415359497e-05, 3.056973218917847e-05, 3.5610049962997437e-05, 4.0650367736816406e-05, 4.5690685510635376e-05, 5.0731003284454346e-05, 5.5771321058273315e-05, 6.0811638832092285e-05, 6.585195660591125e-05, 7.089227437973022e-05, 7.59325921535492e-05, 8.097290992736816e-05, 8.601322770118713e-05, 9.10535454750061e-05, 9.609386324882507e-05, 0.00010113418102264404, 0.00010617449879646301, 0.00011121481657028198, 0.00011625513434410095, 0.00012129545211791992, 0.0001263357698917389, 0.00013137608766555786, 0.00013641640543937683, 0.0001414567232131958, 0.00014649704098701477, 0.00015153735876083374, 0.0001565776765346527, 0.00016161799430847168, 0.00016665831208229065, 0.00017169862985610962, 0.0001767389476299286, 0.00018177926540374756, 0.00018681958317756653, 0.0001918599009513855, 0.00019690021872520447, 0.00020194053649902344]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 5.0, 12.0, 15.0, 22.0, 18.0, 41.0, 62.0, 85.0, 111.0, 158.0, 208.0, 312.0, 482.0, 702.0, 1046.0, 1698.0, 2741.0, 4416.0, 7782.0, 14096.0, 28103.0, 65358.0, 500037.0, 299088.0, 61751.0, 27020.0, 13796.0, 7567.0, 4367.0, 2606.0, 1662.0, 1064.0, 667.0, 454.0, 316.0, 225.0, 128.0, 100.0, 64.0, 56.0, 31.0, 24.0, 15.0, 18.0, 5.0, 8.0, 6.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.39453125, -3.288360595703125, -3.18218994140625, -3.076019287109375, -2.9698486328125, -2.863677978515625, -2.75750732421875, -2.651336669921875, -2.545166015625, -2.438995361328125, -2.33282470703125, -2.226654052734375, -2.1204833984375, -2.014312744140625, -1.90814208984375, -1.801971435546875, -1.69580078125, -1.589630126953125, -1.48345947265625, -1.377288818359375, -1.2711181640625, -1.164947509765625, -1.05877685546875, -0.952606201171875, -0.846435546875, -0.740264892578125, -0.63409423828125, -0.527923583984375, -0.4217529296875, -0.315582275390625, -0.20941162109375, -0.103240966796875, 0.0029296875, 0.109100341796875, 0.21527099609375, 0.321441650390625, 0.4276123046875, 0.533782958984375, 0.63995361328125, 0.746124267578125, 0.852294921875, 0.958465576171875, 1.06463623046875, 1.170806884765625, 1.2769775390625, 1.383148193359375, 1.48931884765625, 1.595489501953125, 1.70166015625, 1.807830810546875, 1.91400146484375, 2.020172119140625, 2.1263427734375, 2.232513427734375, 2.33868408203125, 2.444854736328125, 2.551025390625, 2.657196044921875, 2.76336669921875, 2.869537353515625, 2.9757080078125, 3.081878662109375, 3.18804931640625, 3.294219970703125, 3.400390625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 2.0, 7.0, 7.0, 12.0, 15.0, 17.0, 18.0, 29.0, 37.0, 38.0, 53.0, 73.0, 194.0, 179.0, 65.0, 56.0, 39.0, 20.0, 30.0, 14.0, 17.0, 13.0, 12.0, 5.0, 14.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.97119140625, -0.9408416748046875, -0.910491943359375, -0.8801422119140625, -0.84979248046875, -0.8194427490234375, -0.789093017578125, -0.7587432861328125, -0.7283935546875, -0.6980438232421875, -0.667694091796875, -0.6373443603515625, -0.60699462890625, -0.5766448974609375, -0.546295166015625, -0.5159454345703125, -0.485595703125, -0.4552459716796875, -0.424896240234375, -0.3945465087890625, -0.36419677734375, -0.3338470458984375, -0.303497314453125, -0.2731475830078125, -0.2427978515625, -0.2124481201171875, -0.182098388671875, -0.1517486572265625, -0.12139892578125, -0.0910491943359375, -0.060699462890625, -0.0303497314453125, 0.0, 0.0303497314453125, 0.060699462890625, 0.0910491943359375, 0.12139892578125, 0.1517486572265625, 0.182098388671875, 0.2124481201171875, 0.2427978515625, 0.2731475830078125, 0.303497314453125, 0.3338470458984375, 0.36419677734375, 0.3945465087890625, 0.424896240234375, 0.4552459716796875, 0.485595703125, 0.5159454345703125, 0.546295166015625, 0.5766448974609375, 0.60699462890625, 0.6373443603515625, 0.667694091796875, 0.6980438232421875, 0.7283935546875, 0.7587432861328125, 0.789093017578125, 0.8194427490234375, 0.84979248046875, 0.8801422119140625, 0.910491943359375, 0.9408416748046875, 0.97119140625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 11.0, 15.0, 15.0, 24.0, 33.0, 47.0, 57.0, 66.0, 107.0, 129.0, 114.0, 77.0, 55.0, 50.0, 30.0, 31.0, 25.0, 18.0, 16.0, 13.0, 7.0, 7.0, 5.0, 2.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7730987071990967, -2.675766706466675, -2.578434944152832, -2.48110294342041, -2.3837709426879883, -2.2864391803741455, -2.1891071796417236, -2.091775417327881, -1.994443416595459, -1.8971115350723267, -1.7997795343399048, -1.7024476528167725, -1.6051157712936401, -1.5077838897705078, -1.410451889038086, -1.3131200075149536, -1.2157880067825317, -1.1184561252593994, -1.0211241245269775, -0.9237922430038452, -0.8264603614807129, -0.7291284203529358, -0.6317964792251587, -0.5344645977020264, -0.43713265657424927, -0.33980074524879456, -0.24246881902217865, -0.14513689279556274, -0.04780498147010803, 0.04952692985534668, 0.14685887098312378, 0.2441907525062561, 0.3415226936340332, 0.4388546049594879, 0.5361865162849426, 0.6335184574127197, 0.730850338935852, 0.8281822800636292, 0.9255142211914062, 1.0228461027145386, 1.120177984237671, 1.2175098657608032, 1.314841866493225, 1.4121737480163574, 1.5095056295394897, 1.606837511062622, 1.704169511795044, 1.8015013933181763, 1.8988333940505981, 1.9961652755737305, 2.0934972763061523, 2.190829277038574, 2.288161039352417, 2.385493040084839, 2.4828248023986816, 2.5801568031311035, 2.6774888038635254, 2.7748208045959473, 2.87215256690979, 2.969484567642212, 3.066816568374634, 3.1641483306884766, 3.2614803314208984, 3.3588123321533203, 3.456144094467163]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 5.0, 3.0, 2.0, 10.0, 13.0, 13.0, 21.0, 14.0, 22.0, 24.0, 23.0, 34.0, 22.0, 26.0, 29.0, 23.0, 30.0, 41.0, 49.0, 48.0, 44.0, 47.0, 34.0, 46.0, 46.0, 42.0, 31.0, 41.0, 26.0, 29.0, 22.0, 20.0, 19.0, 19.0, 12.0, 8.0, 15.0, 9.0, 10.0, 4.0, 8.0, 9.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.214357614517212, -2.147066593170166, -2.07977557182312, -2.012484550476074, -1.9451935291290283, -1.8779025077819824, -1.810611367225647, -1.743320345878601, -1.6760293245315552, -1.6087383031845093, -1.5414472818374634, -1.4741562604904175, -1.406865119934082, -1.3395740985870361, -1.2722830772399902, -1.2049920558929443, -1.1377010345458984, -1.0704100131988525, -1.0031189918518066, -0.935827910900116, -0.8685368895530701, -0.8012458682060242, -0.7339547872543335, -0.6666637659072876, -0.5993727445602417, -0.5320817232131958, -0.4647906720638275, -0.39749962091445923, -0.33020859956741333, -0.26291757822036743, -0.19562652707099915, -0.12833547592163086, -0.06104445457458496, 0.006246581673622131, 0.07353761792182922, 0.14082865417003632, 0.2081196904182434, 0.2754107117652893, 0.3427017629146576, 0.4099928140640259, 0.4772838354110718, 0.5445748567581177, 0.6118658781051636, 0.6791569590568542, 0.7464479804039001, 0.813739001750946, 0.8810300827026367, 0.9483211040496826, 1.0156121253967285, 1.0829031467437744, 1.1501941680908203, 1.2174851894378662, 1.284776210784912, 1.352067232131958, 1.4193583726882935, 1.4866493940353394, 1.5539404153823853, 1.6212314367294312, 1.688522458076477, 1.755813479423523, 1.8231046199798584, 1.8903956413269043, 1.9576866626739502, 2.024977684020996, 2.092268705368042]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 13.0, 11.0, 15.0, 24.0, 41.0, 40.0, 59.0, 112.0, 134.0, 173.0, 242.0, 289.0, 430.0, 539.0, 822.0, 1164.0, 1617.0, 2219.0, 3080.0, 4238.0, 5947.0, 8712.0, 12623.0, 18738.0, 27891.0, 43183.0, 68551.0, 113476.0, 207468.0, 492117.0, 1361290.0, 1031658.0, 357470.0, 164592.0, 93905.0, 57586.0, 36768.0, 24379.0, 16155.0, 10999.0, 7596.0, 5365.0, 3800.0, 2628.0, 1900.0, 1260.0, 936.0, 686.0, 464.0, 322.0, 191.0, 131.0, 93.0, 57.0, 42.0, 20.0, 13.0, 8.0, 6.0, 2.0, 1.0], "bins": [-2.373046875, -2.30291748046875, -2.2327880859375, -2.16265869140625, -2.092529296875, -2.02239990234375, -1.9522705078125, -1.88214111328125, -1.81201171875, -1.74188232421875, -1.6717529296875, -1.60162353515625, -1.531494140625, -1.46136474609375, -1.3912353515625, -1.32110595703125, -1.2509765625, -1.18084716796875, -1.1107177734375, -1.04058837890625, -0.970458984375, -0.90032958984375, -0.8302001953125, -0.76007080078125, -0.68994140625, -0.61981201171875, -0.5496826171875, -0.47955322265625, -0.409423828125, -0.33929443359375, -0.2691650390625, -0.19903564453125, -0.12890625, -0.05877685546875, 0.0113525390625, 0.08148193359375, 0.151611328125, 0.22174072265625, 0.2918701171875, 0.36199951171875, 0.43212890625, 0.50225830078125, 0.5723876953125, 0.64251708984375, 0.712646484375, 0.78277587890625, 0.8529052734375, 0.92303466796875, 0.9931640625, 1.06329345703125, 1.1334228515625, 1.20355224609375, 1.273681640625, 1.34381103515625, 1.4139404296875, 1.48406982421875, 1.55419921875, 1.62432861328125, 1.6944580078125, 1.76458740234375, 1.834716796875, 1.90484619140625, 1.9749755859375, 2.04510498046875, 2.115234375]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 8.0, 5.0, 5.0, 11.0, 16.0, 11.0, 17.0, 18.0, 25.0, 21.0, 26.0, 27.0, 28.0, 27.0, 20.0, 48.0, 46.0, 57.0, 44.0, 37.0, 52.0, 41.0, 50.0, 48.0, 54.0, 33.0, 25.0, 34.0, 28.0, 22.0, 17.0, 16.0, 15.0, 12.0, 8.0, 8.0, 11.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.5947265625, -1.5489959716796875, -1.503265380859375, -1.4575347900390625, -1.41180419921875, -1.3660736083984375, -1.320343017578125, -1.2746124267578125, -1.2288818359375, -1.1831512451171875, -1.137420654296875, -1.0916900634765625, -1.04595947265625, -1.0002288818359375, -0.954498291015625, -0.9087677001953125, -0.863037109375, -0.8173065185546875, -0.771575927734375, -0.7258453369140625, -0.68011474609375, -0.6343841552734375, -0.588653564453125, -0.5429229736328125, -0.4971923828125, -0.4514617919921875, -0.405731201171875, -0.3600006103515625, -0.31427001953125, -0.2685394287109375, -0.222808837890625, -0.1770782470703125, -0.13134765625, -0.0856170654296875, -0.039886474609375, 0.0058441162109375, 0.05157470703125, 0.0973052978515625, 0.143035888671875, 0.1887664794921875, 0.2344970703125, 0.2802276611328125, 0.325958251953125, 0.3716888427734375, 0.41741943359375, 0.4631500244140625, 0.508880615234375, 0.5546112060546875, 0.600341796875, 0.6460723876953125, 0.691802978515625, 0.7375335693359375, 0.78326416015625, 0.8289947509765625, 0.874725341796875, 0.9204559326171875, 0.9661865234375, 1.0119171142578125, 1.057647705078125, 1.1033782958984375, 1.14910888671875, 1.1948394775390625, 1.240570068359375, 1.2863006591796875, 1.33203125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 4.0, 6.0, 17.0, 23.0, 26.0, 48.0, 60.0, 90.0, 126.0, 180.0, 280.0, 370.0, 518.0, 796.0, 1206.0, 1652.0, 2507.0, 3574.0, 5493.0, 8337.0, 12815.0, 19923.0, 31882.0, 52225.0, 88551.0, 156253.0, 299499.0, 662123.0, 1391198.0, 725389.0, 321613.0, 165721.0, 92600.0, 54606.0, 33455.0, 21033.0, 13584.0, 8617.0, 5820.0, 3894.0, 2591.0, 1783.0, 1198.0, 816.0, 539.0, 385.0, 263.0, 195.0, 142.0, 84.0, 58.0, 48.0, 22.0, 18.0, 15.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0], "bins": [-2.048828125, -1.98388671875, -1.9189453125, -1.85400390625, -1.7890625, -1.72412109375, -1.6591796875, -1.59423828125, -1.529296875, -1.46435546875, -1.3994140625, -1.33447265625, -1.26953125, -1.20458984375, -1.1396484375, -1.07470703125, -1.009765625, -0.94482421875, -0.8798828125, -0.81494140625, -0.75, -0.68505859375, -0.6201171875, -0.55517578125, -0.490234375, -0.42529296875, -0.3603515625, -0.29541015625, -0.23046875, -0.16552734375, -0.1005859375, -0.03564453125, 0.029296875, 0.09423828125, 0.1591796875, 0.22412109375, 0.2890625, 0.35400390625, 0.4189453125, 0.48388671875, 0.548828125, 0.61376953125, 0.6787109375, 0.74365234375, 0.80859375, 0.87353515625, 0.9384765625, 1.00341796875, 1.068359375, 1.13330078125, 1.1982421875, 1.26318359375, 1.328125, 1.39306640625, 1.4580078125, 1.52294921875, 1.587890625, 1.65283203125, 1.7177734375, 1.78271484375, 1.84765625, 1.91259765625, 1.9775390625, 2.04248046875, 2.107421875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 10.0, 8.0, 7.0, 19.0, 14.0, 23.0, 37.0, 42.0, 51.0, 78.0, 77.0, 79.0, 99.0, 107.0, 125.0, 146.0, 195.0, 185.0, 243.0, 212.0, 236.0, 254.0, 257.0, 217.0, 217.0, 170.0, 151.0, 152.0, 123.0, 87.0, 87.0, 68.0, 47.0, 59.0, 35.0, 25.0, 22.0, 30.0, 18.0, 14.0, 15.0, 7.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0], "bins": [-0.7333984375, -0.71197509765625, -0.6905517578125, -0.66912841796875, -0.647705078125, -0.62628173828125, -0.6048583984375, -0.58343505859375, -0.56201171875, -0.54058837890625, -0.5191650390625, -0.49774169921875, -0.476318359375, -0.45489501953125, -0.4334716796875, -0.41204833984375, -0.390625, -0.36920166015625, -0.3477783203125, -0.32635498046875, -0.304931640625, -0.28350830078125, -0.2620849609375, -0.24066162109375, -0.21923828125, -0.19781494140625, -0.1763916015625, -0.15496826171875, -0.133544921875, -0.11212158203125, -0.0906982421875, -0.06927490234375, -0.0478515625, -0.02642822265625, -0.0050048828125, 0.01641845703125, 0.037841796875, 0.05926513671875, 0.0806884765625, 0.10211181640625, 0.12353515625, 0.14495849609375, 0.1663818359375, 0.18780517578125, 0.209228515625, 0.23065185546875, 0.2520751953125, 0.27349853515625, 0.294921875, 0.31634521484375, 0.3377685546875, 0.35919189453125, 0.380615234375, 0.40203857421875, 0.4234619140625, 0.44488525390625, 0.46630859375, 0.48773193359375, 0.5091552734375, 0.53057861328125, 0.552001953125, 0.57342529296875, 0.5948486328125, 0.61627197265625, 0.6376953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 8.0, 5.0, 13.0, 10.0, 20.0, 19.0, 21.0, 19.0, 43.0, 53.0, 51.0, 88.0, 92.0, 92.0, 83.0, 79.0, 84.0, 47.0, 28.0, 26.0, 25.0, 16.0, 17.0, 13.0, 11.0, 6.0, 3.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7385151386260986, -1.675258994102478, -1.6120028495788574, -1.5487467050552368, -1.4854905605316162, -1.422234296798706, -1.3589781522750854, -1.2957220077514648, -1.2324658632278442, -1.1692097187042236, -1.105953574180603, -1.0426974296569824, -0.979441225528717, -0.9161850810050964, -0.852928876876831, -0.7896727323532104, -0.7264165878295898, -0.6631604433059692, -0.5999042987823486, -0.5366480946540833, -0.47339195013046265, -0.41013580560684204, -0.34687963128089905, -0.28362345695495605, -0.22036731243133545, -0.15711115300655365, -0.09385499358177185, -0.03059883415699005, 0.03265732526779175, 0.09591346979141235, 0.15916964411735535, 0.22242581844329834, 0.28568220138549805, 0.34893834590911865, 0.41219452023506165, 0.47545069456100464, 0.5387068390846252, 0.6019629836082458, 0.6652191877365112, 0.7284753322601318, 0.7917314767837524, 0.854987621307373, 0.9182437658309937, 0.981499969959259, 1.0447561740875244, 1.1080121994018555, 1.1712684631347656, 1.2345246076583862, 1.2977807521820068, 1.3610368967056274, 1.424293041229248, 1.4875491857528687, 1.5508053302764893, 1.6140615940093994, 1.67731773853302, 1.7405738830566406, 1.8038300275802612, 1.8670861721038818, 1.9303423166275024, 1.993598461151123, 2.056854724884033, 2.1201107501983643, 2.1833670139312744, 2.2466230392456055, 2.3098793029785156]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 11.0, 3.0, 8.0, 11.0, 11.0, 16.0, 13.0, 18.0, 19.0, 22.0, 27.0, 41.0, 30.0, 21.0, 31.0, 31.0, 39.0, 37.0, 35.0, 37.0, 41.0, 39.0, 39.0, 39.0, 39.0, 34.0, 37.0, 27.0, 37.0, 28.0, 34.0, 24.0, 17.0, 18.0, 15.0, 10.0, 11.0, 9.0, 6.0, 7.0, 7.0, 7.0, 8.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.595834732055664, -1.5498061180114746, -1.5037776231765747, -1.4577490091323853, -1.4117205142974854, -1.365691900253296, -1.3196632862091064, -1.273634672164917, -1.227606177330017, -1.1815775632858276, -1.1355490684509277, -1.0895204544067383, -1.0434918403625488, -0.9974633455276489, -0.9514347314834595, -0.9054061770439148, -0.8593776226043701, -0.8133490681648254, -0.7673205137252808, -0.7212918996810913, -0.6752633452415466, -0.629234790802002, -0.5832061767578125, -0.5371776223182678, -0.49114906787872314, -0.44512051343917847, -0.3990919291973114, -0.35306334495544434, -0.30703479051589966, -0.261006236076355, -0.21497765183448792, -0.16894906759262085, -0.12292039394378662, -0.07689182460308075, -0.030863255262374878, 0.015165314078330994, 0.061193883419036865, 0.10722245275974274, 0.1532510221004486, 0.19927960634231567, 0.24530816078186035, 0.29133671522140503, 0.3373652994632721, 0.38339388370513916, 0.42942243814468384, 0.4754509925842285, 0.521479606628418, 0.5675081610679626, 0.6135367155075073, 0.659565269947052, 0.7055938243865967, 0.7516224384307861, 0.7976509928703308, 0.8436795473098755, 0.8897081613540649, 0.9357367157936096, 0.9817652702331543, 1.0277938842773438, 1.0738223791122437, 1.119850993156433, 1.165879487991333, 1.2119081020355225, 1.257936716079712, 1.3039653301239014, 1.3499938249588013]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 9.0, 14.0, 13.0, 15.0, 31.0, 49.0, 70.0, 99.0, 140.0, 189.0, 276.0, 409.0, 647.0, 926.0, 1400.0, 2068.0, 3094.0, 4804.0, 7218.0, 11352.0, 18250.0, 30552.0, 53246.0, 98688.0, 215969.0, 298494.0, 132675.0, 67695.0, 38112.0, 22592.0, 14006.0, 8866.0, 5561.0, 3667.0, 2368.0, 1599.0, 1088.0, 708.0, 534.0, 342.0, 223.0, 165.0, 118.0, 88.0, 55.0, 19.0, 19.0, 18.0, 8.0, 4.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.47998046875, -0.464599609375, -0.44921875, -0.433837890625, -0.41845703125, -0.403076171875, -0.3876953125, -0.372314453125, -0.35693359375, -0.341552734375, -0.326171875, -0.310791015625, -0.29541015625, -0.280029296875, -0.2646484375, -0.249267578125, -0.23388671875, -0.218505859375, -0.203125, -0.187744140625, -0.17236328125, -0.156982421875, -0.1416015625, -0.126220703125, -0.11083984375, -0.095458984375, -0.080078125, -0.064697265625, -0.04931640625, -0.033935546875, -0.0185546875, -0.003173828125, 0.01220703125, 0.027587890625, 0.04296875, 0.058349609375, 0.07373046875, 0.089111328125, 0.1044921875, 0.119873046875, 0.13525390625, 0.150634765625, 0.166015625, 0.181396484375, 0.19677734375, 0.212158203125, 0.2275390625, 0.242919921875, 0.25830078125, 0.273681640625, 0.2890625, 0.304443359375, 0.31982421875, 0.335205078125, 0.3505859375, 0.365966796875, 0.38134765625, 0.396728515625, 0.412109375, 0.427490234375, 0.44287109375, 0.458251953125, 0.4736328125, 0.489013671875, 0.50439453125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 5.0, 5.0, 9.0, 8.0, 16.0, 16.0, 12.0, 15.0, 20.0, 26.0, 24.0, 25.0, 36.0, 20.0, 28.0, 36.0, 29.0, 28.0, 34.0, 39.0, 35.0, 49.0, 30.0, 37.0, 31.0, 31.0, 28.0, 39.0, 29.0, 28.0, 31.0, 27.0, 26.0, 20.0, 18.0, 11.0, 14.0, 13.0, 6.0, 9.0, 5.0, 11.0, 4.0, 3.0, 8.0, 1.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-1.3525390625, -1.3093109130859375, -1.266082763671875, -1.2228546142578125, -1.17962646484375, -1.1363983154296875, -1.093170166015625, -1.0499420166015625, -1.0067138671875, -0.9634857177734375, -0.920257568359375, -0.8770294189453125, -0.83380126953125, -0.7905731201171875, -0.747344970703125, -0.7041168212890625, -0.660888671875, -0.6176605224609375, -0.574432373046875, -0.5312042236328125, -0.48797607421875, -0.4447479248046875, -0.401519775390625, -0.3582916259765625, -0.3150634765625, -0.2718353271484375, -0.228607177734375, -0.1853790283203125, -0.14215087890625, -0.0989227294921875, -0.055694580078125, -0.0124664306640625, 0.03076171875, 0.0739898681640625, 0.117218017578125, 0.1604461669921875, 0.20367431640625, 0.2469024658203125, 0.290130615234375, 0.3333587646484375, 0.3765869140625, 0.4198150634765625, 0.463043212890625, 0.5062713623046875, 0.54949951171875, 0.5927276611328125, 0.635955810546875, 0.6791839599609375, 0.722412109375, 0.7656402587890625, 0.808868408203125, 0.8520965576171875, 0.89532470703125, 0.9385528564453125, 0.981781005859375, 1.0250091552734375, 1.0682373046875, 1.1114654541015625, 1.154693603515625, 1.1979217529296875, 1.24114990234375, 1.2843780517578125, 1.327606201171875, 1.3708343505859375, 1.4140625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 0.0, 5.0, 13.0, 6.0, 14.0, 19.0, 36.0, 35.0, 50.0, 71.0, 104.0, 143.0, 249.0, 321.0, 527.0, 729.0, 1252.0, 2041.0, 3405.0, 6239.0, 11366.0, 23061.0, 50227.0, 135179.0, 475749.0, 207394.0, 67945.0, 29411.0, 14393.0, 7662.0, 4332.0, 2444.0, 1436.0, 939.0, 608.0, 340.0, 248.0, 209.0, 106.0, 75.0, 52.0, 38.0, 30.0, 11.0, 13.0, 11.0, 9.0, 4.0, 6.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.8876953125, -0.8628082275390625, -0.837921142578125, -0.8130340576171875, -0.78814697265625, -0.7632598876953125, -0.738372802734375, -0.7134857177734375, -0.6885986328125, -0.6637115478515625, -0.638824462890625, -0.6139373779296875, -0.58905029296875, -0.5641632080078125, -0.539276123046875, -0.5143890380859375, -0.489501953125, -0.4646148681640625, -0.439727783203125, -0.4148406982421875, -0.38995361328125, -0.3650665283203125, -0.340179443359375, -0.3152923583984375, -0.2904052734375, -0.2655181884765625, -0.240631103515625, -0.2157440185546875, -0.19085693359375, -0.1659698486328125, -0.141082763671875, -0.1161956787109375, -0.09130859375, -0.0664215087890625, -0.041534423828125, -0.0166473388671875, 0.00823974609375, 0.0331268310546875, 0.058013916015625, 0.0829010009765625, 0.1077880859375, 0.1326751708984375, 0.157562255859375, 0.1824493408203125, 0.20733642578125, 0.2322235107421875, 0.257110595703125, 0.2819976806640625, 0.306884765625, 0.3317718505859375, 0.356658935546875, 0.3815460205078125, 0.40643310546875, 0.4313201904296875, 0.456207275390625, 0.4810943603515625, 0.5059814453125, 0.5308685302734375, 0.555755615234375, 0.5806427001953125, 0.60552978515625, 0.6304168701171875, 0.655303955078125, 0.6801910400390625, 0.705078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 8.0, 7.0, 9.0, 10.0, 17.0, 10.0, 10.0, 16.0, 21.0, 21.0, 22.0, 37.0, 26.0, 33.0, 27.0, 38.0, 43.0, 44.0, 44.0, 30.0, 44.0, 53.0, 46.0, 54.0, 46.0, 24.0, 33.0, 29.0, 31.0, 31.0, 17.0, 20.0, 12.0, 18.0, 14.0, 7.0, 8.0, 15.0, 7.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8681640625, -0.8363800048828125, -0.804595947265625, -0.7728118896484375, -0.74102783203125, -0.7092437744140625, -0.677459716796875, -0.6456756591796875, -0.6138916015625, -0.5821075439453125, -0.550323486328125, -0.5185394287109375, -0.48675537109375, -0.4549713134765625, -0.423187255859375, -0.3914031982421875, -0.359619140625, -0.3278350830078125, -0.296051025390625, -0.2642669677734375, -0.23248291015625, -0.2006988525390625, -0.168914794921875, -0.1371307373046875, -0.1053466796875, -0.0735626220703125, -0.041778564453125, -0.0099945068359375, 0.02178955078125, 0.0535736083984375, 0.085357666015625, 0.1171417236328125, 0.14892578125, 0.1807098388671875, 0.212493896484375, 0.2442779541015625, 0.27606201171875, 0.3078460693359375, 0.339630126953125, 0.3714141845703125, 0.4031982421875, 0.4349822998046875, 0.466766357421875, 0.4985504150390625, 0.53033447265625, 0.5621185302734375, 0.593902587890625, 0.6256866455078125, 0.657470703125, 0.6892547607421875, 0.721038818359375, 0.7528228759765625, 0.78460693359375, 0.8163909912109375, 0.848175048828125, 0.8799591064453125, 0.9117431640625, 0.9435272216796875, 0.975311279296875, 1.0070953369140625, 1.03887939453125, 1.0706634521484375, 1.102447509765625, 1.1342315673828125, 1.166015625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 11.0, 10.0, 16.0, 24.0, 33.0, 47.0, 46.0, 74.0, 124.0, 200.0, 250.0, 366.0, 518.0, 826.0, 1325.0, 2032.0, 3418.0, 6029.0, 11109.0, 22316.0, 55353.0, 280021.0, 540618.0, 68483.0, 26005.0, 12486.0, 6721.0, 3742.0, 2245.0, 1341.0, 881.0, 595.0, 394.0, 267.0, 170.0, 106.0, 90.0, 84.0, 48.0, 38.0, 22.0, 20.0, 13.0, 7.0, 5.0, 4.0, 11.0, 5.0, 3.0, 1.0, 4.0, 2.0], "bins": [-0.08551025390625, -0.08300209045410156, -0.08049392700195312, -0.07798576354980469, -0.07547760009765625, -0.07296943664550781, -0.07046127319335938, -0.06795310974121094, -0.0654449462890625, -0.06293678283691406, -0.060428619384765625, -0.05792045593261719, -0.05541229248046875, -0.05290412902832031, -0.050395965576171875, -0.04788780212402344, -0.045379638671875, -0.04287147521972656, -0.040363311767578125, -0.03785514831542969, -0.03534698486328125, -0.03283882141113281, -0.030330657958984375, -0.027822494506835938, -0.0253143310546875, -0.022806167602539062, -0.020298004150390625, -0.017789840698242188, -0.01528167724609375, -0.012773513793945312, -0.010265350341796875, -0.0077571868896484375, -0.0052490234375, -0.0027408599853515625, -0.000232696533203125, 0.0022754669189453125, 0.00478363037109375, 0.0072917938232421875, 0.009799957275390625, 0.012308120727539062, 0.0148162841796875, 0.017324447631835938, 0.019832611083984375, 0.022340774536132812, 0.02484893798828125, 0.027357101440429688, 0.029865264892578125, 0.03237342834472656, 0.034881591796875, 0.03738975524902344, 0.039897918701171875, 0.04240608215332031, 0.04491424560546875, 0.04742240905761719, 0.049930572509765625, 0.05243873596191406, 0.0549468994140625, 0.05745506286621094, 0.059963226318359375, 0.06247138977050781, 0.06497955322265625, 0.06748771667480469, 0.06999588012695312, 0.07250404357910156, 0.07501220703125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 3.0, 1.0, 8.0, 2.0, 4.0, 5.0, 12.0, 15.0, 16.0, 35.0, 63.0, 77.0, 73.0, 202.0, 155.0, 77.0, 94.0, 51.0, 28.0, 28.0, 15.0, 11.0, 10.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.119510650634766e-06, -8.841976523399353e-06, -8.56444239616394e-06, -8.286908268928528e-06, -8.009374141693115e-06, -7.731840014457703e-06, -7.45430588722229e-06, -7.1767717599868774e-06, -6.899237632751465e-06, -6.621703505516052e-06, -6.34416937828064e-06, -6.066635251045227e-06, -5.7891011238098145e-06, -5.511566996574402e-06, -5.234032869338989e-06, -4.956498742103577e-06, -4.678964614868164e-06, -4.4014304876327515e-06, -4.123896360397339e-06, -3.846362233161926e-06, -3.5688281059265137e-06, -3.291293978691101e-06, -3.0137598514556885e-06, -2.736225724220276e-06, -2.4586915969848633e-06, -2.1811574697494507e-06, -1.903623342514038e-06, -1.6260892152786255e-06, -1.3485550880432129e-06, -1.0710209608078003e-06, -7.934868335723877e-07, -5.159527063369751e-07, -2.384185791015625e-07, 3.91155481338501e-08, 3.166496753692627e-07, 5.941838026046753e-07, 8.717179298400879e-07, 1.1492520570755005e-06, 1.426786184310913e-06, 1.7043203115463257e-06, 1.9818544387817383e-06, 2.259388566017151e-06, 2.5369226932525635e-06, 2.814456820487976e-06, 3.0919909477233887e-06, 3.3695250749588013e-06, 3.647059202194214e-06, 3.9245933294296265e-06, 4.202127456665039e-06, 4.479661583900452e-06, 4.757195711135864e-06, 5.034729838371277e-06, 5.3122639656066895e-06, 5.589798092842102e-06, 5.867332220077515e-06, 6.144866347312927e-06, 6.42240047454834e-06, 6.6999346017837524e-06, 6.977468729019165e-06, 7.255002856254578e-06, 7.53253698348999e-06, 7.810071110725403e-06, 8.087605237960815e-06, 8.365139365196228e-06, 8.64267349243164e-06]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 13.0, 14.0, 32.0, 36.0, 35.0, 72.0, 78.0, 136.0, 167.0, 251.0, 351.0, 529.0, 721.0, 1171.0, 1723.0, 2872.0, 4840.0, 8680.0, 16790.0, 36770.0, 101042.0, 585712.0, 183382.0, 53371.0, 22671.0, 11077.0, 5944.0, 3510.0, 2173.0, 1416.0, 902.0, 614.0, 436.0, 290.0, 189.0, 165.0, 107.0, 77.0, 53.0, 45.0, 26.0, 14.0, 11.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.101318359375, -0.09812259674072266, -0.09492683410644531, -0.09173107147216797, -0.08853530883789062, -0.08533954620361328, -0.08214378356933594, -0.0789480209350586, -0.07575225830078125, -0.0725564956665039, -0.06936073303222656, -0.06616497039794922, -0.06296920776367188, -0.05977344512939453, -0.05657768249511719, -0.053381919860839844, -0.0501861572265625, -0.046990394592285156, -0.04379463195800781, -0.04059886932373047, -0.037403106689453125, -0.03420734405517578, -0.031011581420898438, -0.027815818786621094, -0.02462005615234375, -0.021424293518066406, -0.018228530883789062, -0.015032768249511719, -0.011837005615234375, -0.008641242980957031, -0.0054454803466796875, -0.0022497177124023438, 0.000946044921875, 0.004141807556152344, 0.0073375701904296875, 0.010533332824707031, 0.013729095458984375, 0.01692485809326172, 0.020120620727539062, 0.023316383361816406, 0.02651214599609375, 0.029707908630371094, 0.03290367126464844, 0.03609943389892578, 0.039295196533203125, 0.04249095916748047, 0.04568672180175781, 0.048882484436035156, 0.0520782470703125, 0.055274009704589844, 0.05846977233886719, 0.06166553497314453, 0.06486129760742188, 0.06805706024169922, 0.07125282287597656, 0.0744485855102539, 0.07764434814453125, 0.0808401107788086, 0.08403587341308594, 0.08723163604736328, 0.09042739868164062, 0.09362316131591797, 0.09681892395019531, 0.10001468658447266, 0.10321044921875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 3.0, 4.0, 5.0, 5.0, 5.0, 10.0, 15.0, 17.0, 13.0, 11.0, 21.0, 19.0, 18.0, 37.0, 42.0, 52.0, 83.0, 91.0, 106.0, 98.0, 72.0, 46.0, 38.0, 30.0, 23.0, 31.0, 12.0, 18.0, 14.0, 10.0, 10.0, 7.0, 2.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0311431884765625, -0.030178308486938477, -0.029213428497314453, -0.02824854850769043, -0.027283668518066406, -0.026318788528442383, -0.02535390853881836, -0.024389028549194336, -0.023424148559570312, -0.02245926856994629, -0.021494388580322266, -0.020529508590698242, -0.01956462860107422, -0.018599748611450195, -0.017634868621826172, -0.01666998863220215, -0.015705108642578125, -0.014740228652954102, -0.013775348663330078, -0.012810468673706055, -0.011845588684082031, -0.010880708694458008, -0.009915828704833984, -0.008950948715209961, -0.007986068725585938, -0.007021188735961914, -0.006056308746337891, -0.005091428756713867, -0.004126548767089844, -0.0031616687774658203, -0.002196788787841797, -0.0012319087982177734, -0.00026702880859375, 0.0006978511810302734, 0.0016627311706542969, 0.0026276111602783203, 0.0035924911499023438, 0.004557371139526367, 0.005522251129150391, 0.006487131118774414, 0.0074520111083984375, 0.008416891098022461, 0.009381771087646484, 0.010346651077270508, 0.011311531066894531, 0.012276411056518555, 0.013241291046142578, 0.014206171035766602, 0.015171051025390625, 0.01613593101501465, 0.017100811004638672, 0.018065690994262695, 0.01903057098388672, 0.019995450973510742, 0.020960330963134766, 0.02192521095275879, 0.022890090942382812, 0.023854970932006836, 0.02481985092163086, 0.025784730911254883, 0.026749610900878906, 0.02771449089050293, 0.028679370880126953, 0.029644250869750977, 0.030609130859375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 8.0, 14.0, 16.0, 19.0, 19.0, 27.0, 33.0, 56.0, 54.0, 84.0, 96.0, 86.0, 92.0, 74.0, 89.0, 41.0, 34.0, 22.0, 33.0, 16.0, 14.0, 15.0, 11.0, 4.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7598187923431396, -1.6958844661712646, -1.6319502592086792, -1.5680160522460938, -1.5040817260742188, -1.4401473999023438, -1.3762131929397583, -1.3122789859771729, -1.2483446598052979, -1.1844103336334229, -1.1204761266708374, -1.056541919708252, -0.992607593536377, -0.9286733269691467, -0.8647390604019165, -0.8008047938346863, -0.736870527267456, -0.6729362607002258, -0.6090019941329956, -0.5450677275657654, -0.48113346099853516, -0.41719919443130493, -0.3532649278640747, -0.2893306612968445, -0.22539639472961426, -0.16146212816238403, -0.09752786159515381, -0.033593595027923584, 0.03034067153930664, 0.09427493810653687, 0.1582092046737671, 0.22214347124099731, 0.28607797622680664, 0.35001224279403687, 0.4139465093612671, 0.4778807759284973, 0.5418150424957275, 0.6057493090629578, 0.669683575630188, 0.7336178421974182, 0.7975521087646484, 0.8614863753318787, 0.9254206418991089, 0.9893549084663391, 1.0532891750335693, 1.1172235012054443, 1.1811577081680298, 1.2450919151306152, 1.3090262413024902, 1.3729605674743652, 1.4368947744369507, 1.5008289813995361, 1.5647633075714111, 1.6286976337432861, 1.6926318407058716, 1.756566047668457, 1.820500373840332, 1.884434700012207, 1.9483689069747925, 2.012303113937378, 2.076237440109253, 2.140171766281128, 2.204105854034424, 2.268040180206299, 2.331974506378174]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 12.0, 3.0, 8.0, 9.0, 12.0, 12.0, 16.0, 19.0, 16.0, 25.0, 29.0, 36.0, 30.0, 24.0, 28.0, 31.0, 38.0, 34.0, 40.0, 40.0, 41.0, 31.0, 45.0, 37.0, 38.0, 34.0, 39.0, 26.0, 39.0, 26.0, 39.0, 21.0, 15.0, 19.0, 18.0, 10.0, 11.0, 8.0, 8.0, 6.0, 6.0, 7.0, 9.0, 1.0, 2.0, 3.0, 0.0, 5.0, 0.0, 1.0], "bins": [-1.6028246879577637, -1.556752324104309, -1.5106799602508545, -1.4646075963974, -1.4185352325439453, -1.3724628686904907, -1.3263905048370361, -1.280318021774292, -1.234245777130127, -1.1881734132766724, -1.1421010494232178, -1.0960286855697632, -1.0499563217163086, -1.003883957862854, -0.9578115344047546, -0.9117391705513, -0.8656667470932007, -0.8195943832397461, -0.7735220193862915, -0.7274496555328369, -0.6813772916793823, -0.6353049278259277, -0.5892325043678284, -0.5431601405143738, -0.4970877766609192, -0.4510154128074646, -0.40494304895401, -0.35887065529823303, -0.31279829144477844, -0.26672592759132385, -0.22065353393554688, -0.17458117008209229, -0.1285088062286377, -0.08243643492460251, -0.03636406362056732, 0.009708315134048462, 0.05578067898750305, 0.10185304284095764, 0.14792543649673462, 0.1939978003501892, 0.2400701642036438, 0.2861425280570984, 0.332214891910553, 0.37828728556632996, 0.42435964941978455, 0.47043201327323914, 0.5165044069290161, 0.5625767707824707, 0.6086491346359253, 0.6547214984893799, 0.7007938623428345, 0.7468662261962891, 0.7929385900497437, 0.8390109539031982, 0.8850833773612976, 0.9311557412147522, 0.9772281050682068, 1.0233005285263062, 1.0693728923797607, 1.1154452562332153, 1.16151762008667, 1.2075899839401245, 1.253662347793579, 1.2997347116470337, 1.3458070755004883]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 6.0, 7.0, 12.0, 20.0, 31.0, 37.0, 70.0, 96.0, 134.0, 245.0, 355.0, 546.0, 851.0, 1327.0, 1893.0, 3242.0, 4980.0, 8068.0, 13179.0, 21934.0, 37568.0, 68788.0, 130364.0, 244786.0, 233675.0, 121952.0, 64636.0, 36087.0, 20509.0, 12308.0, 7727.0, 4703.0, 2908.0, 1942.0, 1236.0, 800.0, 500.0, 339.0, 216.0, 166.0, 99.0, 82.0, 39.0, 44.0, 20.0, 7.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-2.8046875, -2.722076416015625, -2.63946533203125, -2.556854248046875, -2.4742431640625, -2.391632080078125, -2.30902099609375, -2.226409912109375, -2.143798828125, -2.061187744140625, -1.97857666015625, -1.895965576171875, -1.8133544921875, -1.730743408203125, -1.64813232421875, -1.565521240234375, -1.48291015625, -1.400299072265625, -1.31768798828125, -1.235076904296875, -1.1524658203125, -1.069854736328125, -0.98724365234375, -0.904632568359375, -0.822021484375, -0.739410400390625, -0.65679931640625, -0.574188232421875, -0.4915771484375, -0.408966064453125, -0.32635498046875, -0.243743896484375, -0.1611328125, -0.078521728515625, 0.00408935546875, 0.086700439453125, 0.1693115234375, 0.251922607421875, 0.33453369140625, 0.417144775390625, 0.499755859375, 0.582366943359375, 0.66497802734375, 0.747589111328125, 0.8302001953125, 0.912811279296875, 0.99542236328125, 1.078033447265625, 1.16064453125, 1.243255615234375, 1.32586669921875, 1.408477783203125, 1.4910888671875, 1.573699951171875, 1.65631103515625, 1.738922119140625, 1.821533203125, 1.904144287109375, 1.98675537109375, 2.069366455078125, 2.1519775390625, 2.234588623046875, 2.31719970703125, 2.399810791015625, 2.482421875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 8.0, 6.0, 9.0, 14.0, 7.0, 19.0, 18.0, 23.0, 31.0, 33.0, 30.0, 33.0, 29.0, 34.0, 34.0, 50.0, 36.0, 30.0, 39.0, 45.0, 36.0, 45.0, 42.0, 42.0, 30.0, 37.0, 34.0, 32.0, 31.0, 21.0, 27.0, 19.0, 15.0, 12.0, 15.0, 8.0, 4.0, 2.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4951171875, -1.4512939453125, -1.407470703125, -1.3636474609375, -1.31982421875, -1.2760009765625, -1.232177734375, -1.1883544921875, -1.14453125, -1.1007080078125, -1.056884765625, -1.0130615234375, -0.96923828125, -0.9254150390625, -0.881591796875, -0.8377685546875, -0.7939453125, -0.7501220703125, -0.706298828125, -0.6624755859375, -0.61865234375, -0.5748291015625, -0.531005859375, -0.4871826171875, -0.443359375, -0.3995361328125, -0.355712890625, -0.3118896484375, -0.26806640625, -0.2242431640625, -0.180419921875, -0.1365966796875, -0.0927734375, -0.0489501953125, -0.005126953125, 0.0386962890625, 0.08251953125, 0.1263427734375, 0.170166015625, 0.2139892578125, 0.2578125, 0.3016357421875, 0.345458984375, 0.3892822265625, 0.43310546875, 0.4769287109375, 0.520751953125, 0.5645751953125, 0.6083984375, 0.6522216796875, 0.696044921875, 0.7398681640625, 0.78369140625, 0.8275146484375, 0.871337890625, 0.9151611328125, 0.958984375, 1.0028076171875, 1.046630859375, 1.0904541015625, 1.13427734375, 1.1781005859375, 1.221923828125, 1.2657470703125, 1.3095703125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 5.0, 5.0, 18.0, 15.0, 25.0, 35.0, 52.0, 61.0, 97.0, 132.0, 176.0, 254.0, 331.0, 491.0, 742.0, 1006.0, 1483.0, 2120.0, 3075.0, 4601.0, 6953.0, 10318.0, 15673.0, 23811.0, 36878.0, 57095.0, 89184.0, 146638.0, 218704.0, 157706.0, 95912.0, 60036.0, 39274.0, 25532.0, 16541.0, 10735.0, 7204.0, 4894.0, 3324.0, 2238.0, 1574.0, 1082.0, 753.0, 531.0, 355.0, 271.0, 178.0, 122.0, 101.0, 59.0, 54.0, 29.0, 30.0, 13.0, 13.0, 11.0, 8.0, 3.0, 3.0, 0.0, 2.0], "bins": [-1.927734375, -1.866668701171875, -1.80560302734375, -1.744537353515625, -1.6834716796875, -1.622406005859375, -1.56134033203125, -1.500274658203125, -1.439208984375, -1.378143310546875, -1.31707763671875, -1.256011962890625, -1.1949462890625, -1.133880615234375, -1.07281494140625, -1.011749267578125, -0.95068359375, -0.889617919921875, -0.82855224609375, -0.767486572265625, -0.7064208984375, -0.645355224609375, -0.58428955078125, -0.523223876953125, -0.462158203125, -0.401092529296875, -0.34002685546875, -0.278961181640625, -0.2178955078125, -0.156829833984375, -0.09576416015625, -0.034698486328125, 0.0263671875, 0.087432861328125, 0.14849853515625, 0.209564208984375, 0.2706298828125, 0.331695556640625, 0.39276123046875, 0.453826904296875, 0.514892578125, 0.575958251953125, 0.63702392578125, 0.698089599609375, 0.7591552734375, 0.820220947265625, 0.88128662109375, 0.942352294921875, 1.00341796875, 1.064483642578125, 1.12554931640625, 1.186614990234375, 1.2476806640625, 1.308746337890625, 1.36981201171875, 1.430877685546875, 1.491943359375, 1.553009033203125, 1.61407470703125, 1.675140380859375, 1.7362060546875, 1.797271728515625, 1.85833740234375, 1.919403076171875, 1.98046875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 7.0, 7.0, 9.0, 7.0, 8.0, 16.0, 15.0, 26.0, 13.0, 24.0, 13.0, 27.0, 33.0, 25.0, 34.0, 40.0, 38.0, 39.0, 36.0, 26.0, 40.0, 42.0, 30.0, 39.0, 37.0, 45.0, 35.0, 32.0, 28.0, 36.0, 26.0, 26.0, 25.0, 18.0, 13.0, 15.0, 19.0, 9.0, 6.0, 6.0, 4.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.82373046875, -0.798370361328125, -0.77301025390625, -0.747650146484375, -0.7222900390625, -0.696929931640625, -0.67156982421875, -0.646209716796875, -0.620849609375, -0.595489501953125, -0.57012939453125, -0.544769287109375, -0.5194091796875, -0.494049072265625, -0.46868896484375, -0.443328857421875, -0.41796875, -0.392608642578125, -0.36724853515625, -0.341888427734375, -0.3165283203125, -0.291168212890625, -0.26580810546875, -0.240447998046875, -0.215087890625, -0.189727783203125, -0.16436767578125, -0.139007568359375, -0.1136474609375, -0.088287353515625, -0.06292724609375, -0.037567138671875, -0.01220703125, 0.013153076171875, 0.03851318359375, 0.063873291015625, 0.0892333984375, 0.114593505859375, 0.13995361328125, 0.165313720703125, 0.190673828125, 0.216033935546875, 0.24139404296875, 0.266754150390625, 0.2921142578125, 0.317474365234375, 0.34283447265625, 0.368194580078125, 0.3935546875, 0.418914794921875, 0.44427490234375, 0.469635009765625, 0.4949951171875, 0.520355224609375, 0.54571533203125, 0.571075439453125, 0.596435546875, 0.621795654296875, 0.64715576171875, 0.672515869140625, 0.6978759765625, 0.723236083984375, 0.74859619140625, 0.773956298828125, 0.79931640625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 14.0, 18.0, 34.0, 47.0, 55.0, 96.0, 136.0, 172.0, 210.0, 362.0, 448.0, 626.0, 979.0, 1403.0, 2263.0, 3535.0, 5868.0, 10102.0, 18210.0, 37004.0, 91061.0, 601701.0, 162761.0, 53345.0, 24827.0, 13204.0, 7397.0, 4330.0, 2765.0, 1727.0, 1208.0, 772.0, 540.0, 385.0, 267.0, 187.0, 131.0, 93.0, 76.0, 42.0, 42.0, 23.0, 28.0, 18.0, 12.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0], "bins": [-1.9345703125, -1.8788604736328125, -1.823150634765625, -1.7674407958984375, -1.71173095703125, -1.6560211181640625, -1.600311279296875, -1.5446014404296875, -1.4888916015625, -1.4331817626953125, -1.377471923828125, -1.3217620849609375, -1.26605224609375, -1.2103424072265625, -1.154632568359375, -1.0989227294921875, -1.043212890625, -0.9875030517578125, -0.931793212890625, -0.8760833740234375, -0.82037353515625, -0.7646636962890625, -0.708953857421875, -0.6532440185546875, -0.5975341796875, -0.5418243408203125, -0.486114501953125, -0.4304046630859375, -0.37469482421875, -0.3189849853515625, -0.263275146484375, -0.2075653076171875, -0.15185546875, -0.0961456298828125, -0.040435791015625, 0.0152740478515625, 0.07098388671875, 0.1266937255859375, 0.182403564453125, 0.2381134033203125, 0.2938232421875, 0.3495330810546875, 0.405242919921875, 0.4609527587890625, 0.51666259765625, 0.5723724365234375, 0.628082275390625, 0.6837921142578125, 0.739501953125, 0.7952117919921875, 0.850921630859375, 0.9066314697265625, 0.96234130859375, 1.0180511474609375, 1.073760986328125, 1.1294708251953125, 1.1851806640625, 1.2408905029296875, 1.296600341796875, 1.3523101806640625, 1.40802001953125, 1.4637298583984375, 1.519439697265625, 1.5751495361328125, 1.630859375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 9.0, 5.0, 12.0, 9.0, 14.0, 23.0, 38.0, 54.0, 114.0, 408.0, 108.0, 64.0, 36.0, 27.0, 9.0, 19.0, 15.0, 10.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011581182479858398, -0.00011200550943613052, -0.00010819919407367706, -0.0001043928787112236, -0.00010058656334877014, -9.678024798631668e-05, -9.297393262386322e-05, -8.916761726140976e-05, -8.53613018989563e-05, -8.155498653650284e-05, -7.774867117404938e-05, -7.394235581159592e-05, -7.013604044914246e-05, -6.6329725086689e-05, -6.252340972423553e-05, -5.8717094361782074e-05, -5.491077899932861e-05, -5.110446363687515e-05, -4.729814827442169e-05, -4.349183291196823e-05, -3.968551754951477e-05, -3.587920218706131e-05, -3.207288682460785e-05, -2.826657146215439e-05, -2.4460256099700928e-05, -2.0653940737247467e-05, -1.6847625374794006e-05, -1.3041310012340546e-05, -9.234994649887085e-06, -5.428679287433624e-06, -1.6223639249801636e-06, 2.183951437473297e-06, 5.990266799926758e-06, 9.796582162380219e-06, 1.360289752483368e-05, 1.740921288728714e-05, 2.12155282497406e-05, 2.502184361219406e-05, 2.8828158974647522e-05, 3.263447433710098e-05, 3.644078969955444e-05, 4.0247105062007904e-05, 4.4053420424461365e-05, 4.7859735786914825e-05, 5.1666051149368286e-05, 5.547236651182175e-05, 5.927868187427521e-05, 6.308499723672867e-05, 6.689131259918213e-05, 7.069762796163559e-05, 7.450394332408905e-05, 7.831025868654251e-05, 8.211657404899597e-05, 8.592288941144943e-05, 8.972920477390289e-05, 9.353552013635635e-05, 9.734183549880981e-05, 0.00010114815086126328, 0.00010495446622371674, 0.0001087607815861702, 0.00011256709694862366, 0.00011637341231107712, 0.00012017972767353058, 0.00012398604303598404, 0.0001277923583984375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 9.0, 3.0, 14.0, 20.0, 22.0, 39.0, 53.0, 71.0, 91.0, 130.0, 203.0, 306.0, 444.0, 604.0, 984.0, 1431.0, 2134.0, 3252.0, 5192.0, 8134.0, 13017.0, 22384.0, 42122.0, 93149.0, 585204.0, 142728.0, 54973.0, 28019.0, 16586.0, 9732.0, 6110.0, 3901.0, 2447.0, 1670.0, 1101.0, 685.0, 480.0, 362.0, 257.0, 141.0, 105.0, 71.0, 54.0, 31.0, 33.0, 18.0, 11.0, 9.0, 4.0, 9.0, 5.0, 1.0, 2.0, 2.0], "bins": [-1.630859375, -1.5838470458984375, -1.536834716796875, -1.4898223876953125, -1.44281005859375, -1.3957977294921875, -1.348785400390625, -1.3017730712890625, -1.2547607421875, -1.2077484130859375, -1.160736083984375, -1.1137237548828125, -1.06671142578125, -1.0196990966796875, -0.972686767578125, -0.9256744384765625, -0.878662109375, -0.8316497802734375, -0.784637451171875, -0.7376251220703125, -0.69061279296875, -0.6436004638671875, -0.596588134765625, -0.5495758056640625, -0.5025634765625, -0.4555511474609375, -0.408538818359375, -0.3615264892578125, -0.31451416015625, -0.2675018310546875, -0.220489501953125, -0.1734771728515625, -0.12646484375, -0.0794525146484375, -0.032440185546875, 0.0145721435546875, 0.06158447265625, 0.1085968017578125, 0.155609130859375, 0.2026214599609375, 0.2496337890625, 0.2966461181640625, 0.343658447265625, 0.3906707763671875, 0.43768310546875, 0.4846954345703125, 0.531707763671875, 0.5787200927734375, 0.625732421875, 0.6727447509765625, 0.719757080078125, 0.7667694091796875, 0.81378173828125, 0.8607940673828125, 0.907806396484375, 0.9548187255859375, 1.0018310546875, 1.0488433837890625, 1.095855712890625, 1.1428680419921875, 1.18988037109375, 1.2368927001953125, 1.283905029296875, 1.3309173583984375, 1.3779296875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 2.0, 8.0, 3.0, 6.0, 4.0, 12.0, 14.0, 13.0, 18.0, 24.0, 21.0, 33.0, 26.0, 46.0, 52.0, 71.0, 283.0, 61.0, 44.0, 43.0, 36.0, 27.0, 23.0, 16.0, 12.0, 14.0, 18.0, 14.0, 12.0, 5.0, 9.0, 6.0, 3.0, 10.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.384765625, -0.3707122802734375, -0.356658935546875, -0.3426055908203125, -0.32855224609375, -0.3144989013671875, -0.300445556640625, -0.2863922119140625, -0.2723388671875, -0.2582855224609375, -0.244232177734375, -0.2301788330078125, -0.21612548828125, -0.2020721435546875, -0.188018798828125, -0.1739654541015625, -0.159912109375, -0.1458587646484375, -0.131805419921875, -0.1177520751953125, -0.10369873046875, -0.0896453857421875, -0.075592041015625, -0.0615386962890625, -0.0474853515625, -0.0334320068359375, -0.019378662109375, -0.0053253173828125, 0.00872802734375, 0.0227813720703125, 0.036834716796875, 0.0508880615234375, 0.06494140625, 0.0789947509765625, 0.093048095703125, 0.1071014404296875, 0.12115478515625, 0.1352081298828125, 0.149261474609375, 0.1633148193359375, 0.1773681640625, 0.1914215087890625, 0.205474853515625, 0.2195281982421875, 0.23358154296875, 0.2476348876953125, 0.261688232421875, 0.2757415771484375, 0.289794921875, 0.3038482666015625, 0.317901611328125, 0.3319549560546875, 0.34600830078125, 0.3600616455078125, 0.374114990234375, 0.3881683349609375, 0.4022216796875, 0.4162750244140625, 0.430328369140625, 0.4443817138671875, 0.45843505859375, 0.4724884033203125, 0.486541748046875, 0.5005950927734375, 0.5146484375]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 8.0, 9.0, 6.0, 8.0, 11.0, 11.0, 25.0, 30.0, 34.0, 64.0, 66.0, 104.0, 105.0, 102.0, 90.0, 61.0, 46.0, 42.0, 36.0, 33.0, 24.0, 21.0, 13.0, 10.0, 9.0, 3.0, 4.0, 5.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.1592559814453125, -2.095585346221924, -2.031914472579956, -1.9682437181472778, -1.9045729637145996, -1.8409022092819214, -1.7772314548492432, -1.7135608196258545, -1.6498899459838867, -1.5862191915512085, -1.5225484371185303, -1.458877682685852, -1.3952069282531738, -1.3315361738204956, -1.2678654193878174, -1.2041947841644287, -1.1405240297317505, -1.0768532752990723, -1.013182520866394, -0.9495117664337158, -0.8858410120010376, -0.8221702575683594, -0.7584995627403259, -0.6948288083076477, -0.6311580538749695, -0.5674872994422913, -0.503816545009613, -0.4401458203792572, -0.376475065946579, -0.31280431151390076, -0.24913358688354492, -0.1854628324508667, -0.12179207801818848, -0.05812133103609085, 0.005549415946006775, 0.0692201554775238, 0.13289090991020203, 0.19656166434288025, 0.2602323889732361, 0.3239031434059143, 0.38757389783859253, 0.45124465227127075, 0.514915406703949, 0.5785861015319824, 0.6422568559646606, 0.7059276103973389, 0.7695983648300171, 0.8332691192626953, 0.8969398736953735, 0.9606106281280518, 1.02428138256073, 1.0879521369934082, 1.1516228914260864, 1.2152936458587646, 1.2789642810821533, 1.342635154724121, 1.4063057899475098, 1.469976544380188, 1.5336472988128662, 1.5973180532455444, 1.6609888076782227, 1.7246595621109009, 1.788330316543579, 1.8520009517669678, 1.9156718254089355]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 12.0, 13.0, 18.0, 14.0, 13.0, 20.0, 15.0, 19.0, 31.0, 18.0, 28.0, 32.0, 26.0, 35.0, 23.0, 40.0, 40.0, 31.0, 38.0, 37.0, 34.0, 33.0, 35.0, 37.0, 40.0, 27.0, 28.0, 36.0, 33.0, 16.0, 23.0, 19.0, 15.0, 13.0, 19.0, 12.0, 20.0, 10.0, 6.0, 3.0, 4.0, 2.0, 7.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.2988865375518799, -1.2584916353225708, -1.2180967330932617, -1.1777018308639526, -1.1373069286346436, -1.096912145614624, -1.056517243385315, -1.0161223411560059, -0.9757274389266968, -0.9353325366973877, -0.8949376344680786, -0.8545427918434143, -0.8141478896141052, -0.7737529873847961, -0.7333581447601318, -0.6929632425308228, -0.6525683403015137, -0.6121734380722046, -0.5717785358428955, -0.5313836932182312, -0.4909887909889221, -0.45059388875961304, -0.41019901633262634, -0.36980414390563965, -0.32940924167633057, -0.2890143394470215, -0.2486194670200348, -0.2082245796918869, -0.167829692363739, -0.12743480503559113, -0.08703991770744324, -0.04664504528045654, -0.00625002384185791, 0.03414486348628998, 0.07453975081443787, 0.11493463814258575, 0.15532952547073364, 0.19572441279888153, 0.23611930012702942, 0.2765141725540161, 0.3169090747833252, 0.3573039770126343, 0.39769884943962097, 0.43809372186660767, 0.47848862409591675, 0.5188835263252258, 0.5592783689498901, 0.5996732711791992, 0.6400681734085083, 0.6804630756378174, 0.7208579778671265, 0.7612528204917908, 0.8016477227210999, 0.8420426249504089, 0.8824374675750732, 0.9228323698043823, 0.9632272720336914, 1.0036221742630005, 1.0440170764923096, 1.0844119787216187, 1.1248068809509277, 1.1652016639709473, 1.2055965662002563, 1.2459914684295654, 1.2863863706588745]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [4.0, 5.0, 6.0, 10.0, 9.0, 14.0, 24.0, 35.0, 57.0, 93.0, 123.0, 218.0, 322.0, 488.0, 769.0, 1338.0, 2037.0, 2956.0, 4663.0, 7211.0, 10684.0, 16751.0, 27105.0, 44292.0, 75200.0, 133573.0, 270228.0, 784324.0, 1647517.0, 651700.0, 228165.0, 115397.0, 64462.0, 38245.0, 23407.0, 14612.0, 9464.0, 6174.0, 4125.0, 2834.0, 1835.0, 1233.0, 826.0, 555.0, 399.0, 277.0, 162.0, 123.0, 78.0, 58.0, 43.0, 22.0, 22.0, 9.0, 5.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.5927734375, -1.536712646484375, -1.48065185546875, -1.424591064453125, -1.3685302734375, -1.312469482421875, -1.25640869140625, -1.200347900390625, -1.144287109375, -1.088226318359375, -1.03216552734375, -0.976104736328125, -0.9200439453125, -0.863983154296875, -0.80792236328125, -0.751861572265625, -0.69580078125, -0.639739990234375, -0.58367919921875, -0.527618408203125, -0.4715576171875, -0.415496826171875, -0.35943603515625, -0.303375244140625, -0.247314453125, -0.191253662109375, -0.13519287109375, -0.079132080078125, -0.0230712890625, 0.032989501953125, 0.08905029296875, 0.145111083984375, 0.201171875, 0.257232666015625, 0.31329345703125, 0.369354248046875, 0.4254150390625, 0.481475830078125, 0.53753662109375, 0.593597412109375, 0.649658203125, 0.705718994140625, 0.76177978515625, 0.817840576171875, 0.8739013671875, 0.929962158203125, 0.98602294921875, 1.042083740234375, 1.09814453125, 1.154205322265625, 1.21026611328125, 1.266326904296875, 1.3223876953125, 1.378448486328125, 1.43450927734375, 1.490570068359375, 1.546630859375, 1.602691650390625, 1.65875244140625, 1.714813232421875, 1.7708740234375, 1.826934814453125, 1.88299560546875, 1.939056396484375, 1.9951171875]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 11.0, 14.0, 14.0, 19.0, 6.0, 11.0, 23.0, 22.0, 28.0, 34.0, 41.0, 28.0, 23.0, 25.0, 31.0, 30.0, 41.0, 39.0, 45.0, 34.0, 40.0, 38.0, 36.0, 35.0, 28.0, 31.0, 32.0, 21.0, 39.0, 25.0, 18.0, 25.0, 19.0, 8.0, 7.0, 3.0, 15.0, 5.0, 7.0, 6.0, 3.0, 2.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.8525390625, -0.8264389038085938, -0.8003387451171875, -0.7742385864257812, -0.748138427734375, -0.7220382690429688, -0.6959381103515625, -0.6698379516601562, -0.64373779296875, -0.6176376342773438, -0.5915374755859375, -0.5654373168945312, -0.539337158203125, -0.5132369995117188, -0.4871368408203125, -0.46103668212890625, -0.4349365234375, -0.40883636474609375, -0.3827362060546875, -0.35663604736328125, -0.330535888671875, -0.30443572998046875, -0.2783355712890625, -0.25223541259765625, -0.22613525390625, -0.20003509521484375, -0.1739349365234375, -0.14783477783203125, -0.121734619140625, -0.09563446044921875, -0.0695343017578125, -0.04343414306640625, -0.017333984375, 0.00876617431640625, 0.0348663330078125, 0.06096649169921875, 0.087066650390625, 0.11316680908203125, 0.1392669677734375, 0.16536712646484375, 0.19146728515625, 0.21756744384765625, 0.2436676025390625, 0.26976776123046875, 0.295867919921875, 0.32196807861328125, 0.3480682373046875, 0.37416839599609375, 0.4002685546875, 0.42636871337890625, 0.4524688720703125, 0.47856903076171875, 0.504669189453125, 0.5307693481445312, 0.5568695068359375, 0.5829696655273438, 0.60906982421875, 0.6351699829101562, 0.6612701416015625, 0.6873703002929688, 0.713470458984375, 0.7395706176757812, 0.7656707763671875, 0.7917709350585938, 0.81787109375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 12.0, 16.0, 21.0, 30.0, 49.0, 84.0, 136.0, 209.0, 325.0, 488.0, 792.0, 1221.0, 1795.0, 2966.0, 4777.0, 7910.0, 13392.0, 22620.0, 40155.0, 73905.0, 139741.0, 288713.0, 697257.0, 1583305.0, 708223.0, 292310.0, 141914.0, 73909.0, 40335.0, 23026.0, 13334.0, 8096.0, 4928.0, 2994.0, 1883.0, 1241.0, 794.0, 505.0, 314.0, 196.0, 138.0, 97.0, 36.0, 39.0, 29.0, 16.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5771484375, -1.52545166015625, -1.4737548828125, -1.42205810546875, -1.370361328125, -1.31866455078125, -1.2669677734375, -1.21527099609375, -1.16357421875, -1.11187744140625, -1.0601806640625, -1.00848388671875, -0.956787109375, -0.90509033203125, -0.8533935546875, -0.80169677734375, -0.75, -0.69830322265625, -0.6466064453125, -0.59490966796875, -0.543212890625, -0.49151611328125, -0.4398193359375, -0.38812255859375, -0.33642578125, -0.28472900390625, -0.2330322265625, -0.18133544921875, -0.129638671875, -0.07794189453125, -0.0262451171875, 0.02545166015625, 0.0771484375, 0.12884521484375, 0.1805419921875, 0.23223876953125, 0.283935546875, 0.33563232421875, 0.3873291015625, 0.43902587890625, 0.49072265625, 0.54241943359375, 0.5941162109375, 0.64581298828125, 0.697509765625, 0.74920654296875, 0.8009033203125, 0.85260009765625, 0.904296875, 0.95599365234375, 1.0076904296875, 1.05938720703125, 1.111083984375, 1.16278076171875, 1.2144775390625, 1.26617431640625, 1.31787109375, 1.36956787109375, 1.4212646484375, 1.47296142578125, 1.524658203125, 1.57635498046875, 1.6280517578125, 1.67974853515625, 1.7314453125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 5.0, 4.0, 12.0, 11.0, 15.0, 20.0, 34.0, 24.0, 48.0, 53.0, 68.0, 72.0, 87.0, 93.0, 113.0, 153.0, 170.0, 180.0, 198.0, 263.0, 234.0, 261.0, 267.0, 229.0, 223.0, 199.0, 158.0, 157.0, 162.0, 118.0, 87.0, 62.0, 56.0, 60.0, 44.0, 23.0, 25.0, 18.0, 13.0, 13.0, 13.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4423828125, -0.4275665283203125, -0.412750244140625, -0.3979339599609375, -0.38311767578125, -0.3683013916015625, -0.353485107421875, -0.3386688232421875, -0.3238525390625, -0.3090362548828125, -0.294219970703125, -0.2794036865234375, -0.26458740234375, -0.2497711181640625, -0.234954833984375, -0.2201385498046875, -0.205322265625, -0.1905059814453125, -0.175689697265625, -0.1608734130859375, -0.14605712890625, -0.1312408447265625, -0.116424560546875, -0.1016082763671875, -0.0867919921875, -0.0719757080078125, -0.057159423828125, -0.0423431396484375, -0.02752685546875, -0.0127105712890625, 0.002105712890625, 0.0169219970703125, 0.03173828125, 0.0465545654296875, 0.061370849609375, 0.0761871337890625, 0.09100341796875, 0.1058197021484375, 0.120635986328125, 0.1354522705078125, 0.1502685546875, 0.1650848388671875, 0.179901123046875, 0.1947174072265625, 0.20953369140625, 0.2243499755859375, 0.239166259765625, 0.2539825439453125, 0.268798828125, 0.2836151123046875, 0.298431396484375, 0.3132476806640625, 0.32806396484375, 0.3428802490234375, 0.357696533203125, 0.3725128173828125, 0.3873291015625, 0.4021453857421875, 0.416961669921875, 0.4317779541015625, 0.44659423828125, 0.4614105224609375, 0.476226806640625, 0.4910430908203125, 0.505859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 6.0, 6.0, 7.0, 15.0, 10.0, 20.0, 29.0, 32.0, 34.0, 52.0, 66.0, 85.0, 92.0, 125.0, 82.0, 67.0, 56.0, 46.0, 29.0, 25.0, 23.0, 18.0, 12.0, 16.0, 10.0, 7.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6125956773757935, -1.5666866302490234, -1.520777702331543, -1.474868655204773, -1.428959608078003, -1.383050560951233, -1.337141513824463, -1.2912325859069824, -1.2453235387802124, -1.1994144916534424, -1.153505563735962, -1.107596516609192, -1.0616874694824219, -1.0157784223556519, -0.9698694348335266, -0.9239604473114014, -0.8780514001846313, -0.8321423530578613, -0.7862333655357361, -0.7403243780136108, -0.6944153308868408, -0.6485062837600708, -0.6025972962379456, -0.5566883087158203, -0.5107792615890503, -0.46487024426460266, -0.41896122694015503, -0.3730522096157074, -0.32714319229125977, -0.28123417496681213, -0.2353251576423645, -0.18941614031791687, -0.14350712299346924, -0.0975981056690216, -0.051689088344573975, -0.005780071020126343, 0.04012894630432129, 0.08603796362876892, 0.13194698095321655, 0.17785599827766418, 0.22376501560211182, 0.26967403292655945, 0.3155830502510071, 0.3614920675754547, 0.40740108489990234, 0.45331010222435, 0.4992191195487976, 0.5451281070709229, 0.5910371541976929, 0.6369462013244629, 0.6828551888465881, 0.7287641763687134, 0.7746732234954834, 0.8205822706222534, 0.8664912581443787, 0.9124002456665039, 0.9583092927932739, 1.004218339920044, 1.0501272678375244, 1.0960363149642944, 1.1419453620910645, 1.1878544092178345, 1.2337634563446045, 1.279672384262085, 1.325581431388855]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 10.0, 11.0, 11.0, 12.0, 23.0, 15.0, 19.0, 15.0, 26.0, 38.0, 31.0, 22.0, 30.0, 45.0, 37.0, 32.0, 36.0, 45.0, 34.0, 25.0, 32.0, 31.0, 25.0, 26.0, 34.0, 28.0, 33.0, 32.0, 28.0, 30.0, 17.0, 25.0, 13.0, 20.0, 15.0, 15.0, 12.0, 12.0, 12.0, 3.0, 7.0, 5.0, 8.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8729379773139954, -0.8449516296386719, -0.8169652223587036, -0.7889788746833801, -0.7609925270080566, -0.7330061197280884, -0.7050197720527649, -0.6770334243774414, -0.6490470170974731, -0.6210606694221497, -0.5930742621421814, -0.5650879144668579, -0.5371015071868896, -0.5091151595115662, -0.4811288118362427, -0.4531424343585968, -0.4251560568809509, -0.39716967940330505, -0.3691833019256592, -0.3411969542503357, -0.3132105767726898, -0.28522419929504395, -0.25723785161972046, -0.22925147414207458, -0.2012650966644287, -0.17327871918678284, -0.14529235661029816, -0.11730598658323288, -0.0893196165561676, -0.06133323907852173, -0.03334687650203705, -0.005360513925552368, 0.02262592315673828, 0.05061229318380356, 0.07859866321086884, 0.10658503323793411, 0.1345714032649994, 0.16255778074264526, 0.19054414331912994, 0.21853050589561462, 0.2465168833732605, 0.27450326085090637, 0.30248963832855225, 0.33047598600387573, 0.3584623634815216, 0.3864487409591675, 0.41443508863449097, 0.44242146611213684, 0.4704078435897827, 0.4983942210674286, 0.5263805985450745, 0.554366946220398, 0.5823533535003662, 0.6103397011756897, 0.6383260488510132, 0.6663124561309814, 0.6942988038063049, 0.7222851514816284, 0.7502715587615967, 0.7782579064369202, 0.8062442541122437, 0.8342306613922119, 0.8622170090675354, 0.8902033567428589, 0.9181897640228271]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 15.0, 20.0, 26.0, 46.0, 58.0, 106.0, 136.0, 219.0, 320.0, 510.0, 805.0, 1202.0, 1802.0, 2938.0, 4744.0, 7622.0, 12719.0, 21785.0, 37917.0, 70670.0, 141904.0, 312621.0, 209885.0, 98090.0, 51418.0, 28513.0, 16313.0, 9907.0, 6006.0, 3639.0, 2311.0, 1496.0, 974.0, 661.0, 378.0, 257.0, 172.0, 115.0, 79.0, 52.0, 34.0, 19.0, 12.0, 11.0, 8.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37060546875, -0.358551025390625, -0.34649658203125, -0.334442138671875, -0.3223876953125, -0.310333251953125, -0.29827880859375, -0.286224365234375, -0.274169921875, -0.262115478515625, -0.25006103515625, -0.238006591796875, -0.2259521484375, -0.213897705078125, -0.20184326171875, -0.189788818359375, -0.177734375, -0.165679931640625, -0.15362548828125, -0.141571044921875, -0.1295166015625, -0.117462158203125, -0.10540771484375, -0.093353271484375, -0.081298828125, -0.069244384765625, -0.05718994140625, -0.045135498046875, -0.0330810546875, -0.021026611328125, -0.00897216796875, 0.003082275390625, 0.01513671875, 0.027191162109375, 0.03924560546875, 0.051300048828125, 0.0633544921875, 0.075408935546875, 0.08746337890625, 0.099517822265625, 0.111572265625, 0.123626708984375, 0.13568115234375, 0.147735595703125, 0.1597900390625, 0.171844482421875, 0.18389892578125, 0.195953369140625, 0.2080078125, 0.220062255859375, 0.23211669921875, 0.244171142578125, 0.2562255859375, 0.268280029296875, 0.28033447265625, 0.292388916015625, 0.304443359375, 0.316497802734375, 0.32855224609375, 0.340606689453125, 0.3526611328125, 0.364715576171875, 0.37677001953125, 0.388824462890625, 0.40087890625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 3.0, 10.0, 9.0, 14.0, 14.0, 16.0, 18.0, 18.0, 29.0, 23.0, 31.0, 32.0, 30.0, 40.0, 35.0, 45.0, 46.0, 36.0, 39.0, 36.0, 36.0, 37.0, 30.0, 38.0, 32.0, 35.0, 19.0, 34.0, 36.0, 24.0, 22.0, 19.0, 15.0, 12.0, 18.0, 17.0, 6.0, 8.0, 8.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.994659423828125, -0.96295166015625, -0.931243896484375, -0.8995361328125, -0.867828369140625, -0.83612060546875, -0.804412841796875, -0.772705078125, -0.740997314453125, -0.70928955078125, -0.677581787109375, -0.6458740234375, -0.614166259765625, -0.58245849609375, -0.550750732421875, -0.51904296875, -0.487335205078125, -0.45562744140625, -0.423919677734375, -0.3922119140625, -0.360504150390625, -0.32879638671875, -0.297088623046875, -0.265380859375, -0.233673095703125, -0.20196533203125, -0.170257568359375, -0.1385498046875, -0.106842041015625, -0.07513427734375, -0.043426513671875, -0.01171875, 0.019989013671875, 0.05169677734375, 0.083404541015625, 0.1151123046875, 0.146820068359375, 0.17852783203125, 0.210235595703125, 0.241943359375, 0.273651123046875, 0.30535888671875, 0.337066650390625, 0.3687744140625, 0.400482177734375, 0.43218994140625, 0.463897705078125, 0.49560546875, 0.527313232421875, 0.55902099609375, 0.590728759765625, 0.6224365234375, 0.654144287109375, 0.68585205078125, 0.717559814453125, 0.749267578125, 0.780975341796875, 0.81268310546875, 0.844390869140625, 0.8760986328125, 0.907806396484375, 0.93951416015625, 0.971221923828125, 1.0029296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 4.0, 7.0, 8.0, 18.0, 22.0, 30.0, 33.0, 62.0, 68.0, 100.0, 153.0, 185.0, 279.0, 360.0, 551.0, 812.0, 1187.0, 1734.0, 2716.0, 4173.0, 6981.0, 11878.0, 21371.0, 41696.0, 88983.0, 257785.0, 379240.0, 115092.0, 50982.0, 25653.0, 14070.0, 8150.0, 4831.0, 3125.0, 1997.0, 1330.0, 887.0, 635.0, 428.0, 267.0, 184.0, 149.0, 85.0, 72.0, 52.0, 42.0, 25.0, 16.0, 14.0, 10.0, 10.0, 5.0, 9.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0], "bins": [-0.465576171875, -0.4501304626464844, -0.43468475341796875, -0.4192390441894531, -0.4037933349609375, -0.3883476257324219, -0.37290191650390625, -0.3574562072753906, -0.342010498046875, -0.3265647888183594, -0.31111907958984375, -0.2956733703613281, -0.2802276611328125, -0.2647819519042969, -0.24933624267578125, -0.23389053344726562, -0.21844482421875, -0.20299911499023438, -0.18755340576171875, -0.17210769653320312, -0.1566619873046875, -0.14121627807617188, -0.12577056884765625, -0.11032485961914062, -0.094879150390625, -0.07943344116210938, -0.06398773193359375, -0.048542022705078125, -0.0330963134765625, -0.017650604248046875, -0.00220489501953125, 0.013240814208984375, 0.0286865234375, 0.044132232666015625, 0.05957794189453125, 0.07502365112304688, 0.0904693603515625, 0.10591506958007812, 0.12136077880859375, 0.13680648803710938, 0.152252197265625, 0.16769790649414062, 0.18314361572265625, 0.19858932495117188, 0.2140350341796875, 0.22948074340820312, 0.24492645263671875, 0.2603721618652344, 0.27581787109375, 0.2912635803222656, 0.30670928955078125, 0.3221549987792969, 0.3376007080078125, 0.3530464172363281, 0.36849212646484375, 0.3839378356933594, 0.399383544921875, 0.4148292541503906, 0.43027496337890625, 0.4457206726074219, 0.4611663818359375, 0.4766120910644531, 0.49205780029296875, 0.5075035095214844, 0.52294921875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 9.0, 7.0, 9.0, 10.0, 5.0, 13.0, 9.0, 18.0, 27.0, 23.0, 19.0, 32.0, 35.0, 44.0, 41.0, 50.0, 44.0, 34.0, 37.0, 55.0, 50.0, 41.0, 44.0, 32.0, 41.0, 26.0, 36.0, 25.0, 27.0, 27.0, 25.0, 18.0, 14.0, 13.0, 17.0, 7.0, 11.0, 10.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.67626953125, -0.654388427734375, -0.63250732421875, -0.610626220703125, -0.5887451171875, -0.566864013671875, -0.54498291015625, -0.523101806640625, -0.501220703125, -0.479339599609375, -0.45745849609375, -0.435577392578125, -0.4136962890625, -0.391815185546875, -0.36993408203125, -0.348052978515625, -0.326171875, -0.304290771484375, -0.28240966796875, -0.260528564453125, -0.2386474609375, -0.216766357421875, -0.19488525390625, -0.173004150390625, -0.151123046875, -0.129241943359375, -0.10736083984375, -0.085479736328125, -0.0635986328125, -0.041717529296875, -0.01983642578125, 0.002044677734375, 0.02392578125, 0.045806884765625, 0.06768798828125, 0.089569091796875, 0.1114501953125, 0.133331298828125, 0.15521240234375, 0.177093505859375, 0.198974609375, 0.220855712890625, 0.24273681640625, 0.264617919921875, 0.2864990234375, 0.308380126953125, 0.33026123046875, 0.352142333984375, 0.3740234375, 0.395904541015625, 0.41778564453125, 0.439666748046875, 0.4615478515625, 0.483428955078125, 0.50531005859375, 0.527191162109375, 0.549072265625, 0.570953369140625, 0.59283447265625, 0.614715576171875, 0.6365966796875, 0.658477783203125, 0.68035888671875, 0.702239990234375, 0.72412109375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 10.0, 3.0, 19.0, 21.0, 21.0, 37.0, 59.0, 82.0, 103.0, 156.0, 241.0, 374.0, 491.0, 816.0, 1255.0, 1975.0, 3250.0, 5633.0, 10174.0, 20233.0, 46563.0, 159894.0, 632913.0, 94435.0, 33945.0, 15598.0, 8141.0, 4611.0, 2716.0, 1631.0, 1030.0, 690.0, 427.0, 288.0, 227.0, 134.0, 93.0, 73.0, 50.0, 43.0, 24.0, 19.0, 20.0, 7.0, 8.0, 3.0, 5.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.043853759765625, -0.04230546951293945, -0.040757179260253906, -0.03920888900756836, -0.03766059875488281, -0.036112308502197266, -0.03456401824951172, -0.03301572799682617, -0.031467437744140625, -0.029919147491455078, -0.02837085723876953, -0.026822566986083984, -0.025274276733398438, -0.02372598648071289, -0.022177696228027344, -0.020629405975341797, -0.01908111572265625, -0.017532825469970703, -0.015984535217285156, -0.01443624496459961, -0.012887954711914062, -0.011339664459228516, -0.009791374206542969, -0.008243083953857422, -0.006694793701171875, -0.005146503448486328, -0.0035982131958007812, -0.0020499229431152344, -0.0005016326904296875, 0.0010466575622558594, 0.0025949478149414062, 0.004143238067626953, 0.0056915283203125, 0.007239818572998047, 0.008788108825683594, 0.01033639907836914, 0.011884689331054688, 0.013432979583740234, 0.014981269836425781, 0.016529560089111328, 0.018077850341796875, 0.019626140594482422, 0.02117443084716797, 0.022722721099853516, 0.024271011352539062, 0.02581930160522461, 0.027367591857910156, 0.028915882110595703, 0.03046417236328125, 0.0320124626159668, 0.033560752868652344, 0.03510904312133789, 0.03665733337402344, 0.038205623626708984, 0.03975391387939453, 0.04130220413208008, 0.042850494384765625, 0.04439878463745117, 0.04594707489013672, 0.047495365142822266, 0.04904365539550781, 0.05059194564819336, 0.052140235900878906, 0.05368852615356445, 0.05523681640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 10.0, 8.0, 22.0, 19.0, 23.0, 57.0, 87.0, 116.0, 195.0, 163.0, 95.0, 42.0, 45.0, 34.0, 31.0, 12.0, 3.0, 4.0, 9.0, 4.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.119510650634766e-06, -8.889473974704742e-06, -8.65943729877472e-06, -8.429400622844696e-06, -8.199363946914673e-06, -7.96932727098465e-06, -7.739290595054626e-06, -7.509253919124603e-06, -7.27921724319458e-06, -7.049180567264557e-06, -6.819143891334534e-06, -6.5891072154045105e-06, -6.359070539474487e-06, -6.129033863544464e-06, -5.898997187614441e-06, -5.668960511684418e-06, -5.4389238357543945e-06, -5.208887159824371e-06, -4.978850483894348e-06, -4.748813807964325e-06, -4.518777132034302e-06, -4.2887404561042786e-06, -4.058703780174255e-06, -3.828667104244232e-06, -3.598630428314209e-06, -3.368593752384186e-06, -3.1385570764541626e-06, -2.9085204005241394e-06, -2.678483724594116e-06, -2.448447048664093e-06, -2.21841037273407e-06, -1.9883736968040466e-06, -1.7583370208740234e-06, -1.5283003449440002e-06, -1.298263669013977e-06, -1.0682269930839539e-06, -8.381903171539307e-07, -6.081536412239075e-07, -3.781169652938843e-07, -1.4808028936386108e-07, 8.195638656616211e-08, 3.119930624961853e-07, 5.420297384262085e-07, 7.720664143562317e-07, 1.0021030902862549e-06, 1.232139766216278e-06, 1.4621764421463013e-06, 1.6922131180763245e-06, 1.9222497940063477e-06, 2.152286469936371e-06, 2.382323145866394e-06, 2.6123598217964172e-06, 2.8423964977264404e-06, 3.0724331736564636e-06, 3.302469849586487e-06, 3.53250652551651e-06, 3.762543201446533e-06, 3.992579877376556e-06, 4.22261655330658e-06, 4.452653229236603e-06, 4.682689905166626e-06, 4.912726581096649e-06, 5.142763257026672e-06, 5.3727999329566956e-06, 5.602836608886719e-06]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 5.0, 14.0, 19.0, 17.0, 47.0, 49.0, 70.0, 88.0, 125.0, 159.0, 247.0, 380.0, 493.0, 727.0, 993.0, 1425.0, 1972.0, 2905.0, 4284.0, 6736.0, 11128.0, 20508.0, 42062.0, 109096.0, 539959.0, 181502.0, 58428.0, 26606.0, 14008.0, 8153.0, 5159.0, 3407.0, 2326.0, 1577.0, 1084.0, 800.0, 600.0, 386.0, 281.0, 207.0, 152.0, 115.0, 74.0, 51.0, 45.0, 23.0, 28.0, 11.0, 8.0, 13.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0458984375, -0.044403076171875, -0.04290771484375, -0.041412353515625, -0.0399169921875, -0.038421630859375, -0.03692626953125, -0.035430908203125, -0.033935546875, -0.032440185546875, -0.03094482421875, -0.029449462890625, -0.0279541015625, -0.026458740234375, -0.02496337890625, -0.023468017578125, -0.02197265625, -0.020477294921875, -0.01898193359375, -0.017486572265625, -0.0159912109375, -0.014495849609375, -0.01300048828125, -0.011505126953125, -0.010009765625, -0.008514404296875, -0.00701904296875, -0.005523681640625, -0.0040283203125, -0.002532958984375, -0.00103759765625, 0.000457763671875, 0.001953125, 0.003448486328125, 0.00494384765625, 0.006439208984375, 0.0079345703125, 0.009429931640625, 0.01092529296875, 0.012420654296875, 0.013916015625, 0.015411376953125, 0.01690673828125, 0.018402099609375, 0.0198974609375, 0.021392822265625, 0.02288818359375, 0.024383544921875, 0.02587890625, 0.027374267578125, 0.02886962890625, 0.030364990234375, 0.0318603515625, 0.033355712890625, 0.03485107421875, 0.036346435546875, 0.037841796875, 0.039337158203125, 0.04083251953125, 0.042327880859375, 0.0438232421875, 0.045318603515625, 0.04681396484375, 0.048309326171875, 0.0498046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 8.0, 3.0, 3.0, 4.0, 9.0, 12.0, 18.0, 18.0, 30.0, 57.0, 74.0, 112.0, 258.0, 141.0, 89.0, 36.0, 29.0, 15.0, 14.0, 9.0, 10.0, 9.0, 6.0, 6.0, 7.0, 1.0, 0.0, 5.0, 0.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0276641845703125, -0.02676105499267578, -0.025857925415039062, -0.024954795837402344, -0.024051666259765625, -0.023148536682128906, -0.022245407104492188, -0.02134227752685547, -0.02043914794921875, -0.01953601837158203, -0.018632888793945312, -0.017729759216308594, -0.016826629638671875, -0.015923500061035156, -0.015020370483398438, -0.014117240905761719, -0.013214111328125, -0.012310981750488281, -0.011407852172851562, -0.010504722595214844, -0.009601593017578125, -0.008698463439941406, -0.0077953338623046875, -0.006892204284667969, -0.00598907470703125, -0.005085945129394531, -0.0041828155517578125, -0.0032796859741210938, -0.002376556396484375, -0.0014734268188476562, -0.0005702972412109375, 0.00033283233642578125, 0.0012359619140625, 0.0021390914916992188, 0.0030422210693359375, 0.003945350646972656, 0.004848480224609375, 0.005751609802246094, 0.0066547393798828125, 0.007557868957519531, 0.00846099853515625, 0.009364128112792969, 0.010267257690429688, 0.011170387268066406, 0.012073516845703125, 0.012976646423339844, 0.013879776000976562, 0.014782905578613281, 0.01568603515625, 0.01658916473388672, 0.017492294311523438, 0.018395423889160156, 0.019298553466796875, 0.020201683044433594, 0.021104812622070312, 0.02200794219970703, 0.02291107177734375, 0.02381420135498047, 0.024717330932617188, 0.025620460510253906, 0.026523590087890625, 0.027426719665527344, 0.028329849243164062, 0.02923297882080078, 0.0301361083984375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 4.0, 6.0, 7.0, 9.0, 15.0, 11.0, 27.0, 32.0, 34.0, 47.0, 70.0, 77.0, 94.0, 133.0, 84.0, 66.0, 66.0, 44.0, 35.0, 23.0, 25.0, 16.0, 15.0, 15.0, 15.0, 1.0, 3.0, 1.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5970919132232666, -1.5505011081695557, -1.5039103031158447, -1.4573194980621338, -1.4107286930084229, -1.364137887954712, -1.317547082901001, -1.27095627784729, -1.224365472793579, -1.1777746677398682, -1.1311838626861572, -1.0845930576324463, -1.0380022525787354, -0.9914114475250244, -0.9448206424713135, -0.8982298374176025, -0.8516390919685364, -0.8050482869148254, -0.7584574818611145, -0.7118666768074036, -0.6652758717536926, -0.6186850666999817, -0.5720943212509155, -0.5255035161972046, -0.47891268134117126, -0.4323218762874603, -0.3857310712337494, -0.33914029598236084, -0.2925494909286499, -0.24595867097377777, -0.19936788082122803, -0.1527770757675171, -0.10618627071380615, -0.05959546938538551, -0.013004668056964874, 0.033586129546165466, 0.0801769345998764, 0.12676773965358734, 0.17335852980613708, 0.21994933485984802, 0.26654013991355896, 0.3131309449672699, 0.35972175002098083, 0.4063125252723694, 0.4529033303260803, 0.49949413537979126, 0.5460849404335022, 0.5926757454872131, 0.6392665505409241, 0.685857355594635, 0.732448160648346, 0.7790389657020569, 0.8256297707557678, 0.8722205758094788, 0.9188113212585449, 0.9654021263122559, 1.0119929313659668, 1.0585837364196777, 1.1051745414733887, 1.1517653465270996, 1.1983561515808105, 1.2449469566345215, 1.2915377616882324, 1.3381285667419434, 1.3847193717956543]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 2.0, 4.0, 15.0, 7.0, 12.0, 12.0, 21.0, 14.0, 21.0, 17.0, 23.0, 39.0, 30.0, 26.0, 26.0, 46.0, 36.0, 32.0, 35.0, 41.0, 39.0, 26.0, 30.0, 30.0, 28.0, 23.0, 35.0, 31.0, 37.0, 27.0, 27.0, 30.0, 19.0, 23.0, 18.0, 14.0, 15.0, 16.0, 15.0, 11.0, 12.0, 4.0, 5.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8738977313041687, -0.8460028767585754, -0.8181079626083374, -0.7902131080627441, -0.7623182535171509, -0.7344233989715576, -0.7065285444259644, -0.6786336302757263, -0.6507387757301331, -0.6228439211845398, -0.5949490070343018, -0.5670541524887085, -0.5391592979431152, -0.511264443397522, -0.4833695590496063, -0.4554746747016907, -0.4275798201560974, -0.39968496561050415, -0.3717900812625885, -0.34389519691467285, -0.3160003423690796, -0.28810548782348633, -0.2602106034755707, -0.23231573402881622, -0.20442086458206177, -0.1765259951353073, -0.14863112568855286, -0.1207362562417984, -0.09284138679504395, -0.06494651734828949, -0.037051647901535034, -0.009156778454780579, 0.018738090991973877, 0.04663296043872833, 0.07452782988548279, 0.10242269933223724, 0.1303175687789917, 0.15821243822574615, 0.1861073076725006, 0.21400217711925507, 0.24189704656600952, 0.2697919011116028, 0.29768678545951843, 0.3255816698074341, 0.35347652435302734, 0.3813713788986206, 0.40926626324653625, 0.4371611475944519, 0.46505600214004517, 0.4929508566856384, 0.5208457708358765, 0.5487406253814697, 0.576635479927063, 0.6045303344726562, 0.6324251890182495, 0.6603201031684875, 0.6882149577140808, 0.7161098122596741, 0.7440047264099121, 0.7718995809555054, 0.7997944355010986, 0.8276892900466919, 0.8555841445922852, 0.8834790587425232, 0.9113739132881165]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 4.0, 3.0, 13.0, 20.0, 29.0, 25.0, 46.0, 53.0, 93.0, 122.0, 145.0, 262.0, 330.0, 465.0, 644.0, 920.0, 1330.0, 1913.0, 2901.0, 4130.0, 6061.0, 9149.0, 13650.0, 21444.0, 34730.0, 58704.0, 106458.0, 210605.0, 255768.0, 132556.0, 71298.0, 41324.0, 24789.0, 16027.0, 10469.0, 6844.0, 4734.0, 3235.0, 2164.0, 1552.0, 1053.0, 715.0, 514.0, 367.0, 253.0, 186.0, 136.0, 108.0, 73.0, 44.0, 33.0, 27.0, 15.0, 12.0, 6.0, 4.0, 7.0, 5.0, 0.0, 0.0, 1.0], "bins": [-1.6455078125, -1.59271240234375, -1.5399169921875, -1.48712158203125, -1.434326171875, -1.38153076171875, -1.3287353515625, -1.27593994140625, -1.22314453125, -1.17034912109375, -1.1175537109375, -1.06475830078125, -1.011962890625, -0.95916748046875, -0.9063720703125, -0.85357666015625, -0.80078125, -0.74798583984375, -0.6951904296875, -0.64239501953125, -0.589599609375, -0.53680419921875, -0.4840087890625, -0.43121337890625, -0.37841796875, -0.32562255859375, -0.2728271484375, -0.22003173828125, -0.167236328125, -0.11444091796875, -0.0616455078125, -0.00885009765625, 0.0439453125, 0.09674072265625, 0.1495361328125, 0.20233154296875, 0.255126953125, 0.30792236328125, 0.3607177734375, 0.41351318359375, 0.46630859375, 0.51910400390625, 0.5718994140625, 0.62469482421875, 0.677490234375, 0.73028564453125, 0.7830810546875, 0.83587646484375, 0.888671875, 0.94146728515625, 0.9942626953125, 1.04705810546875, 1.099853515625, 1.15264892578125, 1.2054443359375, 1.25823974609375, 1.31103515625, 1.36383056640625, 1.4166259765625, 1.46942138671875, 1.522216796875, 1.57501220703125, 1.6278076171875, 1.68060302734375, 1.7333984375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 11.0, 11.0, 14.0, 15.0, 20.0, 22.0, 24.0, 38.0, 22.0, 24.0, 32.0, 32.0, 46.0, 41.0, 43.0, 34.0, 36.0, 43.0, 30.0, 38.0, 33.0, 28.0, 26.0, 43.0, 31.0, 25.0, 31.0, 29.0, 19.0, 17.0, 25.0, 15.0, 12.0, 13.0, 9.0, 12.0, 10.0, 8.0, 6.0, 2.0, 7.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8466796875, -0.8196792602539062, -0.7926788330078125, -0.7656784057617188, -0.738677978515625, -0.7116775512695312, -0.6846771240234375, -0.6576766967773438, -0.63067626953125, -0.6036758422851562, -0.5766754150390625, -0.5496749877929688, -0.522674560546875, -0.49567413330078125, -0.4686737060546875, -0.44167327880859375, -0.4146728515625, -0.38767242431640625, -0.3606719970703125, -0.33367156982421875, -0.306671142578125, -0.27967071533203125, -0.2526702880859375, -0.22566986083984375, -0.19866943359375, -0.17166900634765625, -0.1446685791015625, -0.11766815185546875, -0.090667724609375, -0.06366729736328125, -0.0366668701171875, -0.00966644287109375, 0.017333984375, 0.04433441162109375, 0.0713348388671875, 0.09833526611328125, 0.125335693359375, 0.15233612060546875, 0.1793365478515625, 0.20633697509765625, 0.23333740234375, 0.26033782958984375, 0.2873382568359375, 0.31433868408203125, 0.341339111328125, 0.36833953857421875, 0.3953399658203125, 0.42234039306640625, 0.4493408203125, 0.47634124755859375, 0.5033416748046875, 0.5303421020507812, 0.557342529296875, 0.5843429565429688, 0.6113433837890625, 0.6383438110351562, 0.66534423828125, 0.6923446655273438, 0.7193450927734375, 0.7463455200195312, 0.773345947265625, 0.8003463745117188, 0.8273468017578125, 0.8543472290039062, 0.88134765625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 9.0, 7.0, 13.0, 13.0, 22.0, 23.0, 37.0, 67.0, 92.0, 133.0, 148.0, 229.0, 353.0, 440.0, 719.0, 997.0, 1420.0, 2086.0, 3011.0, 4373.0, 6571.0, 10105.0, 15277.0, 24323.0, 40072.0, 69134.0, 125213.0, 238717.0, 221689.0, 115369.0, 63841.0, 37642.0, 22766.0, 14357.0, 9485.0, 6143.0, 4367.0, 2888.0, 1944.0, 1418.0, 912.0, 630.0, 421.0, 328.0, 227.0, 157.0, 118.0, 76.0, 56.0, 41.0, 30.0, 19.0, 12.0, 7.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0], "bins": [-1.6240234375, -1.5731658935546875, -1.522308349609375, -1.4714508056640625, -1.42059326171875, -1.3697357177734375, -1.318878173828125, -1.2680206298828125, -1.2171630859375, -1.1663055419921875, -1.115447998046875, -1.0645904541015625, -1.01373291015625, -0.9628753662109375, -0.912017822265625, -0.8611602783203125, -0.810302734375, -0.7594451904296875, -0.708587646484375, -0.6577301025390625, -0.60687255859375, -0.5560150146484375, -0.505157470703125, -0.4542999267578125, -0.4034423828125, -0.3525848388671875, -0.301727294921875, -0.2508697509765625, -0.20001220703125, -0.1491546630859375, -0.098297119140625, -0.0474395751953125, 0.00341796875, 0.0542755126953125, 0.105133056640625, 0.1559906005859375, 0.20684814453125, 0.2577056884765625, 0.308563232421875, 0.3594207763671875, 0.4102783203125, 0.4611358642578125, 0.511993408203125, 0.5628509521484375, 0.61370849609375, 0.6645660400390625, 0.715423583984375, 0.7662811279296875, 0.817138671875, 0.8679962158203125, 0.918853759765625, 0.9697113037109375, 1.02056884765625, 1.0714263916015625, 1.122283935546875, 1.1731414794921875, 1.2239990234375, 1.2748565673828125, 1.325714111328125, 1.3765716552734375, 1.42742919921875, 1.4782867431640625, 1.529144287109375, 1.5800018310546875, 1.630859375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 0.0, 11.0, 7.0, 15.0, 18.0, 14.0, 16.0, 16.0, 22.0, 14.0, 26.0, 29.0, 21.0, 30.0, 33.0, 38.0, 32.0, 32.0, 34.0, 32.0, 34.0, 41.0, 37.0, 36.0, 40.0, 37.0, 32.0, 26.0, 17.0, 27.0, 25.0, 22.0, 31.0, 21.0, 18.0, 21.0, 15.0, 18.0, 16.0, 10.0, 9.0, 4.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.54736328125, -0.5311241149902344, -0.5148849487304688, -0.4986457824707031, -0.4824066162109375, -0.4661674499511719, -0.44992828369140625, -0.4336891174316406, -0.417449951171875, -0.4012107849121094, -0.38497161865234375, -0.3687324523925781, -0.3524932861328125, -0.3362541198730469, -0.32001495361328125, -0.3037757873535156, -0.28753662109375, -0.2712974548339844, -0.25505828857421875, -0.23881912231445312, -0.2225799560546875, -0.20634078979492188, -0.19010162353515625, -0.17386245727539062, -0.157623291015625, -0.14138412475585938, -0.12514495849609375, -0.10890579223632812, -0.0926666259765625, -0.07642745971679688, -0.06018829345703125, -0.043949127197265625, -0.0277099609375, -0.011470794677734375, 0.00476837158203125, 0.021007537841796875, 0.0372467041015625, 0.053485870361328125, 0.06972503662109375, 0.08596420288085938, 0.102203369140625, 0.11844253540039062, 0.13468170166015625, 0.15092086791992188, 0.1671600341796875, 0.18339920043945312, 0.19963836669921875, 0.21587753295898438, 0.23211669921875, 0.24835586547851562, 0.26459503173828125, 0.2808341979980469, 0.2970733642578125, 0.3133125305175781, 0.32955169677734375, 0.3457908630371094, 0.362030029296875, 0.3782691955566406, 0.39450836181640625, 0.4107475280761719, 0.4269866943359375, 0.4432258605957031, 0.45946502685546875, 0.4757041931152344, 0.491943359375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 11.0, 11.0, 17.0, 24.0, 31.0, 36.0, 63.0, 89.0, 114.0, 171.0, 203.0, 282.0, 404.0, 573.0, 762.0, 1153.0, 1622.0, 2457.0, 3925.0, 6620.0, 11472.0, 22758.0, 58301.0, 803063.0, 75426.0, 26053.0, 12840.0, 7158.0, 4281.0, 2706.0, 1714.0, 1191.0, 866.0, 591.0, 441.0, 299.0, 202.0, 166.0, 129.0, 82.0, 55.0, 54.0, 42.0, 24.0, 26.0, 16.0, 8.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0], "bins": [-1.25390625, -1.2176513671875, -1.181396484375, -1.1451416015625, -1.10888671875, -1.0726318359375, -1.036376953125, -1.0001220703125, -0.9638671875, -0.9276123046875, -0.891357421875, -0.8551025390625, -0.81884765625, -0.7825927734375, -0.746337890625, -0.7100830078125, -0.673828125, -0.6375732421875, -0.601318359375, -0.5650634765625, -0.52880859375, -0.4925537109375, -0.456298828125, -0.4200439453125, -0.3837890625, -0.3475341796875, -0.311279296875, -0.2750244140625, -0.23876953125, -0.2025146484375, -0.166259765625, -0.1300048828125, -0.09375, -0.0574951171875, -0.021240234375, 0.0150146484375, 0.05126953125, 0.0875244140625, 0.123779296875, 0.1600341796875, 0.1962890625, 0.2325439453125, 0.268798828125, 0.3050537109375, 0.34130859375, 0.3775634765625, 0.413818359375, 0.4500732421875, 0.486328125, 0.5225830078125, 0.558837890625, 0.5950927734375, 0.63134765625, 0.6676025390625, 0.703857421875, 0.7401123046875, 0.7763671875, 0.8126220703125, 0.848876953125, 0.8851318359375, 0.92138671875, 0.9576416015625, 0.993896484375, 1.0301513671875, 1.06640625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 3.0, 7.0, 11.0, 19.0, 29.0, 40.0, 85.0, 525.0, 135.0, 52.0, 25.0, 11.0, 10.0, 13.0, 3.0, 5.0, 1.0, 6.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4001808166503906e-05, -5.1977112889289856e-05, -4.9952417612075806e-05, -4.7927722334861755e-05, -4.5903027057647705e-05, -4.3878331780433655e-05, -4.1853636503219604e-05, -3.9828941226005554e-05, -3.7804245948791504e-05, -3.5779550671577454e-05, -3.37548553943634e-05, -3.173016011714935e-05, -2.9705464839935303e-05, -2.7680769562721252e-05, -2.5656074285507202e-05, -2.3631379008293152e-05, -2.16066837310791e-05, -1.958198845386505e-05, -1.7557293176651e-05, -1.553259789943695e-05, -1.35079026222229e-05, -1.148320734500885e-05, -9.4585120677948e-06, -7.4338167905807495e-06, -5.409121513366699e-06, -3.384426236152649e-06, -1.3597309589385986e-06, 6.649643182754517e-07, 2.689659595489502e-06, 4.714354872703552e-06, 6.7390501499176025e-06, 8.763745427131653e-06, 1.0788440704345703e-05, 1.2813135981559753e-05, 1.4837831258773804e-05, 1.6862526535987854e-05, 1.8887221813201904e-05, 2.0911917090415955e-05, 2.2936612367630005e-05, 2.4961307644844055e-05, 2.6986002922058105e-05, 2.9010698199272156e-05, 3.1035393476486206e-05, 3.3060088753700256e-05, 3.508478403091431e-05, 3.710947930812836e-05, 3.913417458534241e-05, 4.115886986255646e-05, 4.318356513977051e-05, 4.520826041698456e-05, 4.723295569419861e-05, 4.925765097141266e-05, 5.128234624862671e-05, 5.330704152584076e-05, 5.533173680305481e-05, 5.735643208026886e-05, 5.938112735748291e-05, 6.140582263469696e-05, 6.343051791191101e-05, 6.545521318912506e-05, 6.747990846633911e-05, 6.950460374355316e-05, 7.152929902076721e-05, 7.355399429798126e-05, 7.557868957519531e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 12.0, 16.0, 27.0, 32.0, 37.0, 43.0, 75.0, 133.0, 178.0, 223.0, 331.0, 510.0, 764.0, 1077.0, 1739.0, 2646.0, 4555.0, 8645.0, 19846.0, 61772.0, 838350.0, 65478.0, 20506.0, 8891.0, 4747.0, 2686.0, 1760.0, 1109.0, 715.0, 527.0, 297.0, 256.0, 163.0, 114.0, 77.0, 69.0, 36.0, 34.0, 19.0, 17.0, 10.0, 9.0, 10.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.607421875, -1.5594635009765625, -1.511505126953125, -1.4635467529296875, -1.41558837890625, -1.3676300048828125, -1.319671630859375, -1.2717132568359375, -1.2237548828125, -1.1757965087890625, -1.127838134765625, -1.0798797607421875, -1.03192138671875, -0.9839630126953125, -0.936004638671875, -0.8880462646484375, -0.840087890625, -0.7921295166015625, -0.744171142578125, -0.6962127685546875, -0.64825439453125, -0.6002960205078125, -0.552337646484375, -0.5043792724609375, -0.4564208984375, -0.4084625244140625, -0.360504150390625, -0.3125457763671875, -0.26458740234375, -0.2166290283203125, -0.168670654296875, -0.1207122802734375, -0.07275390625, -0.0247955322265625, 0.023162841796875, 0.0711212158203125, 0.11907958984375, 0.1670379638671875, 0.214996337890625, 0.2629547119140625, 0.3109130859375, 0.3588714599609375, 0.406829833984375, 0.4547882080078125, 0.50274658203125, 0.5507049560546875, 0.598663330078125, 0.6466217041015625, 0.694580078125, 0.7425384521484375, 0.790496826171875, 0.8384552001953125, 0.88641357421875, 0.9343719482421875, 0.982330322265625, 1.0302886962890625, 1.0782470703125, 1.1262054443359375, 1.174163818359375, 1.2221221923828125, 1.27008056640625, 1.3180389404296875, 1.365997314453125, 1.4139556884765625, 1.4619140625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 10.0, 9.0, 13.0, 19.0, 24.0, 22.0, 76.0, 541.0, 106.0, 32.0, 33.0, 26.0, 12.0, 18.0, 8.0, 9.0, 3.0, 2.0, 5.0, 7.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.459716796875, -0.44680023193359375, -0.4338836669921875, -0.42096710205078125, -0.408050537109375, -0.39513397216796875, -0.3822174072265625, -0.36930084228515625, -0.35638427734375, -0.34346771240234375, -0.3305511474609375, -0.31763458251953125, -0.304718017578125, -0.29180145263671875, -0.2788848876953125, -0.26596832275390625, -0.2530517578125, -0.24013519287109375, -0.2272186279296875, -0.21430206298828125, -0.201385498046875, -0.18846893310546875, -0.1755523681640625, -0.16263580322265625, -0.14971923828125, -0.13680267333984375, -0.1238861083984375, -0.11096954345703125, -0.098052978515625, -0.08513641357421875, -0.0722198486328125, -0.05930328369140625, -0.04638671875, -0.03347015380859375, -0.0205535888671875, -0.00763702392578125, 0.005279541015625, 0.01819610595703125, 0.0311126708984375, 0.04402923583984375, 0.05694580078125, 0.06986236572265625, 0.0827789306640625, 0.09569549560546875, 0.108612060546875, 0.12152862548828125, 0.1344451904296875, 0.14736175537109375, 0.1602783203125, 0.17319488525390625, 0.1861114501953125, 0.19902801513671875, 0.211944580078125, 0.22486114501953125, 0.2377777099609375, 0.25069427490234375, 0.26361083984375, 0.27652740478515625, 0.2894439697265625, 0.30236053466796875, 0.315277099609375, 0.32819366455078125, 0.3411102294921875, 0.35402679443359375, 0.366943359375]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 11.0, 8.0, 10.0, 14.0, 20.0, 19.0, 28.0, 32.0, 42.0, 53.0, 53.0, 68.0, 95.0, 93.0, 80.0, 73.0, 51.0, 35.0, 32.0, 22.0, 28.0, 21.0, 17.0, 11.0, 12.0, 10.0, 5.0, 6.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.1725246906280518, -1.136929988861084, -1.1013352870941162, -1.0657404661178589, -1.0301457643508911, -0.9945510625839233, -0.9589563012123108, -0.9233615398406982, -0.8877668380737305, -0.8521721363067627, -0.8165773749351501, -0.7809826135635376, -0.7453879117965698, -0.709793210029602, -0.6741984486579895, -0.638603687286377, -0.6030089855194092, -0.5674142837524414, -0.5318195223808289, -0.4962247908115387, -0.46063005924224854, -0.4250353276729584, -0.3894405961036682, -0.35384586453437805, -0.3182511329650879, -0.28265640139579773, -0.24706166982650757, -0.2114669382572174, -0.17587220668792725, -0.14027747511863708, -0.10468274354934692, -0.06908801198005676, -0.03349316120147705, 0.0021015703678131104, 0.03769630193710327, 0.07329103350639343, 0.1088857650756836, 0.14448049664497375, 0.18007522821426392, 0.21566995978355408, 0.25126469135284424, 0.2868594229221344, 0.32245415449142456, 0.3580488860607147, 0.3936436176300049, 0.42923834919929504, 0.4648330807685852, 0.5004278421401978, 0.5360225439071655, 0.5716172456741333, 0.6072120070457458, 0.6428067684173584, 0.6784014701843262, 0.713996171951294, 0.7495909333229065, 0.785185694694519, 0.8207803964614868, 0.8563750982284546, 0.8919698596000671, 0.9275646209716797, 0.9631593227386475, 0.9987540245056152, 1.034348726272583, 1.0699435472488403, 1.105538249015808]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 5.0, 7.0, 5.0, 10.0, 12.0, 14.0, 13.0, 17.0, 27.0, 21.0, 28.0, 31.0, 40.0, 41.0, 42.0, 37.0, 41.0, 36.0, 38.0, 31.0, 39.0, 42.0, 37.0, 44.0, 27.0, 40.0, 26.0, 22.0, 27.0, 21.0, 26.0, 19.0, 20.0, 19.0, 16.0, 17.0, 9.0, 11.0, 9.0, 8.0, 7.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8190056681632996, -0.7898914217948914, -0.7607771754264832, -0.731662929058075, -0.702548623085022, -0.6734343767166138, -0.6443201303482056, -0.6152058839797974, -0.5860916376113892, -0.556977391242981, -0.5278631448745728, -0.49874886870384216, -0.46963462233543396, -0.44052037596702576, -0.41140609979629517, -0.38229185342788696, -0.35317760705947876, -0.32406336069107056, -0.29494911432266235, -0.26583483815193176, -0.23672059178352356, -0.20760634541511536, -0.17849208414554596, -0.14937782287597656, -0.12026357650756836, -0.09114932268857956, -0.06203506886959076, -0.03292081505060196, -0.003806561231613159, 0.025307685136795044, 0.05442194640636444, 0.08353620767593384, 0.11265051364898682, 0.14176476001739502, 0.17087902128696442, 0.1999932825565338, 0.22910752892494202, 0.2582217752933502, 0.2873360514640808, 0.316450297832489, 0.3455645442008972, 0.3746787905693054, 0.4037930369377136, 0.4329073131084442, 0.4620215594768524, 0.4911358058452606, 0.5202500820159912, 0.5493643283843994, 0.5784785747528076, 0.6075928211212158, 0.636707067489624, 0.6658213138580322, 0.6949355602264404, 0.7240498065948486, 0.7531641125679016, 0.7822783589363098, 0.811392605304718, 0.8405068516731262, 0.8696210980415344, 0.8987353444099426, 0.9278496503829956, 0.9569638967514038, 0.986078143119812, 1.0151923894882202, 1.0443066358566284]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 10.0, 20.0, 21.0, 29.0, 46.0, 56.0, 74.0, 115.0, 165.0, 297.0, 439.0, 670.0, 981.0, 1538.0, 2296.0, 3660.0, 5808.0, 9411.0, 15149.0, 24921.0, 42274.0, 75723.0, 144001.0, 318958.0, 1035870.0, 1591188.0, 490624.0, 193867.0, 97767.0, 53667.0, 31465.0, 19098.0, 11936.0, 7843.0, 4894.0, 3114.0, 2010.0, 1382.0, 878.0, 665.0, 436.0, 296.0, 200.0, 138.0, 99.0, 48.0, 38.0, 30.0, 16.0, 19.0, 10.0, 10.0, 7.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.23046875, -1.1897430419921875, -1.149017333984375, -1.1082916259765625, -1.06756591796875, -1.0268402099609375, -0.986114501953125, -0.9453887939453125, -0.9046630859375, -0.8639373779296875, -0.823211669921875, -0.7824859619140625, -0.74176025390625, -0.7010345458984375, -0.660308837890625, -0.6195831298828125, -0.578857421875, -0.5381317138671875, -0.497406005859375, -0.4566802978515625, -0.41595458984375, -0.3752288818359375, -0.334503173828125, -0.2937774658203125, -0.2530517578125, -0.2123260498046875, -0.171600341796875, -0.1308746337890625, -0.09014892578125, -0.0494232177734375, -0.008697509765625, 0.0320281982421875, 0.07275390625, 0.1134796142578125, 0.154205322265625, 0.1949310302734375, 0.23565673828125, 0.2763824462890625, 0.317108154296875, 0.3578338623046875, 0.3985595703125, 0.4392852783203125, 0.480010986328125, 0.5207366943359375, 0.56146240234375, 0.6021881103515625, 0.642913818359375, 0.6836395263671875, 0.724365234375, 0.7650909423828125, 0.805816650390625, 0.8465423583984375, 0.88726806640625, 0.9279937744140625, 0.968719482421875, 1.0094451904296875, 1.0501708984375, 1.0908966064453125, 1.131622314453125, 1.1723480224609375, 1.21307373046875, 1.2537994384765625, 1.294525146484375, 1.3352508544921875, 1.3759765625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 1.0, 5.0, 4.0, 8.0, 11.0, 12.0, 14.0, 14.0, 15.0, 20.0, 19.0, 27.0, 34.0, 32.0, 36.0, 35.0, 38.0, 29.0, 35.0, 41.0, 52.0, 39.0, 31.0, 32.0, 39.0, 33.0, 36.0, 23.0, 30.0, 24.0, 36.0, 22.0, 23.0, 21.0, 21.0, 13.0, 15.0, 10.0, 19.0, 13.0, 4.0, 7.0, 7.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.5166015625, -0.498779296875, -0.48095703125, -0.463134765625, -0.4453125, -0.427490234375, -0.40966796875, -0.391845703125, -0.3740234375, -0.356201171875, -0.33837890625, -0.320556640625, -0.302734375, -0.284912109375, -0.26708984375, -0.249267578125, -0.2314453125, -0.213623046875, -0.19580078125, -0.177978515625, -0.16015625, -0.142333984375, -0.12451171875, -0.106689453125, -0.0888671875, -0.071044921875, -0.05322265625, -0.035400390625, -0.017578125, 0.000244140625, 0.01806640625, 0.035888671875, 0.0537109375, 0.071533203125, 0.08935546875, 0.107177734375, 0.125, 0.142822265625, 0.16064453125, 0.178466796875, 0.1962890625, 0.214111328125, 0.23193359375, 0.249755859375, 0.267578125, 0.285400390625, 0.30322265625, 0.321044921875, 0.3388671875, 0.356689453125, 0.37451171875, 0.392333984375, 0.41015625, 0.427978515625, 0.44580078125, 0.463623046875, 0.4814453125, 0.499267578125, 0.51708984375, 0.534912109375, 0.552734375, 0.570556640625, 0.58837890625, 0.606201171875, 0.6240234375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 5.0, 15.0, 15.0, 19.0, 41.0, 53.0, 64.0, 102.0, 140.0, 220.0, 310.0, 488.0, 768.0, 1140.0, 1697.0, 2668.0, 3922.0, 6202.0, 9762.0, 15335.0, 24219.0, 39376.0, 64706.0, 109848.0, 200068.0, 396356.0, 998676.0, 1274840.0, 487115.0, 234372.0, 127691.0, 73973.0, 44617.0, 27410.0, 17169.0, 10900.0, 6971.0, 4469.0, 2919.0, 1891.0, 1294.0, 787.0, 540.0, 376.0, 211.0, 180.0, 115.0, 63.0, 45.0, 46.0, 25.0, 23.0, 13.0, 12.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.9580078125, -0.9272308349609375, -0.896453857421875, -0.8656768798828125, -0.83489990234375, -0.8041229248046875, -0.773345947265625, -0.7425689697265625, -0.7117919921875, -0.6810150146484375, -0.650238037109375, -0.6194610595703125, -0.58868408203125, -0.5579071044921875, -0.527130126953125, -0.4963531494140625, -0.465576171875, -0.4347991943359375, -0.404022216796875, -0.3732452392578125, -0.34246826171875, -0.3116912841796875, -0.280914306640625, -0.2501373291015625, -0.2193603515625, -0.1885833740234375, -0.157806396484375, -0.1270294189453125, -0.09625244140625, -0.0654754638671875, -0.034698486328125, -0.0039215087890625, 0.02685546875, 0.0576324462890625, 0.088409423828125, 0.1191864013671875, 0.14996337890625, 0.1807403564453125, 0.211517333984375, 0.2422943115234375, 0.2730712890625, 0.3038482666015625, 0.334625244140625, 0.3654022216796875, 0.39617919921875, 0.4269561767578125, 0.457733154296875, 0.4885101318359375, 0.519287109375, 0.5500640869140625, 0.580841064453125, 0.6116180419921875, 0.64239501953125, 0.6731719970703125, 0.703948974609375, 0.7347259521484375, 0.7655029296875, 0.7962799072265625, 0.827056884765625, 0.8578338623046875, 0.88861083984375, 0.9193878173828125, 0.950164794921875, 0.9809417724609375, 1.01171875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 8.0, 15.0, 19.0, 15.0, 33.0, 32.0, 48.0, 44.0, 65.0, 67.0, 82.0, 112.0, 102.0, 138.0, 137.0, 181.0, 170.0, 235.0, 243.0, 229.0, 257.0, 228.0, 238.0, 181.0, 185.0, 154.0, 140.0, 113.0, 103.0, 86.0, 81.0, 65.0, 58.0, 44.0, 30.0, 27.0, 27.0, 15.0, 11.0, 10.0, 9.0, 13.0, 6.0, 8.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.32275390625, -0.3131141662597656, -0.30347442626953125, -0.2938346862792969, -0.2841949462890625, -0.2745552062988281, -0.26491546630859375, -0.2552757263183594, -0.245635986328125, -0.23599624633789062, -0.22635650634765625, -0.21671676635742188, -0.2070770263671875, -0.19743728637695312, -0.18779754638671875, -0.17815780639648438, -0.16851806640625, -0.15887832641601562, -0.14923858642578125, -0.13959884643554688, -0.1299591064453125, -0.12031936645507812, -0.11067962646484375, -0.10103988647460938, -0.091400146484375, -0.08176040649414062, -0.07212066650390625, -0.062480926513671875, -0.0528411865234375, -0.043201446533203125, -0.03356170654296875, -0.023921966552734375, -0.0142822265625, -0.004642486572265625, 0.00499725341796875, 0.014636993408203125, 0.0242767333984375, 0.033916473388671875, 0.04355621337890625, 0.053195953369140625, 0.062835693359375, 0.07247543334960938, 0.08211517333984375, 0.09175491333007812, 0.1013946533203125, 0.11103439331054688, 0.12067413330078125, 0.13031387329101562, 0.13995361328125, 0.14959335327148438, 0.15923309326171875, 0.16887283325195312, 0.1785125732421875, 0.18815231323242188, 0.19779205322265625, 0.20743179321289062, 0.217071533203125, 0.22671127319335938, 0.23635101318359375, 0.24599075317382812, 0.2556304931640625, 0.2652702331542969, 0.27490997314453125, 0.2845497131347656, 0.294189453125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 3.0, 4.0, 10.0, 8.0, 8.0, 12.0, 18.0, 19.0, 21.0, 35.0, 37.0, 59.0, 70.0, 100.0, 90.0, 102.0, 74.0, 73.0, 55.0, 41.0, 31.0, 22.0, 26.0, 19.0, 8.0, 7.0, 9.0, 7.0, 4.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9248051643371582, -0.8949794173240662, -0.8651536703109741, -0.8353279232978821, -0.80550217628479, -0.775676429271698, -0.745850682258606, -0.7160249948501587, -0.6861991882324219, -0.6563734412193298, -0.6265476942062378, -0.5967219471931458, -0.5668962001800537, -0.5370704531669617, -0.5072447061538696, -0.4774189889431, -0.4475932717323303, -0.4177675247192383, -0.38794177770614624, -0.3581160306930542, -0.32829028367996216, -0.2984645366668701, -0.26863881945610046, -0.23881307244300842, -0.20898732542991638, -0.17916157841682434, -0.1493358314037323, -0.11951009929180145, -0.08968435227870941, -0.05985860526561737, -0.030032873153686523, -0.00020712614059448242, 0.029618680477142334, 0.05944442376494408, 0.08927016705274582, 0.11909590661525726, 0.1489216536283493, 0.17874740064144135, 0.2085731327533722, 0.23839887976646423, 0.2682246267795563, 0.2980503737926483, 0.32787612080574036, 0.35770183801651, 0.38752758502960205, 0.4173533320426941, 0.44717907905578613, 0.4770048260688782, 0.5068305730819702, 0.5366563200950623, 0.5664820671081543, 0.5963078141212463, 0.6261335611343384, 0.6559593081474304, 0.6857850551605225, 0.7156107425689697, 0.7454365491867065, 0.7752622961997986, 0.8050880432128906, 0.8349137902259827, 0.8647395372390747, 0.8945652842521667, 0.9243910312652588, 0.954216718673706, 0.9840424656867981]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 8.0, 8.0, 11.0, 20.0, 17.0, 22.0, 15.0, 22.0, 25.0, 25.0, 29.0, 42.0, 40.0, 37.0, 41.0, 43.0, 33.0, 42.0, 35.0, 44.0, 28.0, 31.0, 40.0, 43.0, 33.0, 21.0, 23.0, 32.0, 18.0, 24.0, 20.0, 10.0, 18.0, 21.0, 13.0, 12.0, 6.0, 8.0, 2.0, 11.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6352312564849854, -0.6149871349334717, -0.5947430729866028, -0.5744989514350891, -0.5542548298835754, -0.5340107679367065, -0.5137666463851929, -0.4935225248336792, -0.4732784330844879, -0.45303434133529663, -0.43279021978378296, -0.4125461280345917, -0.3923020362854004, -0.3720579147338867, -0.35181382298469543, -0.33156973123550415, -0.3113256096839905, -0.2910815179347992, -0.2708373963832855, -0.25059330463409424, -0.23034919798374176, -0.21010509133338928, -0.189860999584198, -0.16961689293384552, -0.14937278628349304, -0.12912867963314056, -0.10888458043336868, -0.0886404812335968, -0.06839637458324432, -0.048152267932891846, -0.027908168733119965, -0.0076640695333480835, 0.012580037117004395, 0.032824140042066574, 0.053068242967128754, 0.07331234216690063, 0.09355644881725311, 0.11380055546760559, 0.13404464721679688, 0.15428875386714935, 0.17453286051750183, 0.1947769671678543, 0.2150210738182068, 0.23526516556739807, 0.25550925731658936, 0.275753378868103, 0.2959974706172943, 0.3162415623664856, 0.33648568391799927, 0.35672977566719055, 0.3769738972187042, 0.3972179889678955, 0.4174621105194092, 0.43770620226860046, 0.45795029401779175, 0.4781944155693054, 0.4984385073184967, 0.518682599067688, 0.5389267206192017, 0.5591708421707153, 0.5794149041175842, 0.5996590256690979, 0.6199031472206116, 0.6401472091674805, 0.6603913307189941]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 14.0, 11.0, 29.0, 32.0, 30.0, 59.0, 73.0, 106.0, 166.0, 206.0, 316.0, 459.0, 625.0, 1093.0, 1751.0, 2507.0, 4059.0, 6342.0, 10381.0, 17384.0, 30057.0, 55517.0, 111122.0, 261113.0, 287040.0, 119094.0, 58968.0, 31943.0, 18379.0, 10923.0, 6765.0, 4175.0, 2712.0, 1657.0, 1045.0, 744.0, 473.0, 353.0, 248.0, 180.0, 119.0, 71.0, 55.0, 38.0, 29.0, 23.0, 19.0, 15.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.2452392578125, -0.2370777130126953, -0.22891616821289062, -0.22075462341308594, -0.21259307861328125, -0.20443153381347656, -0.19626998901367188, -0.1881084442138672, -0.1799468994140625, -0.1717853546142578, -0.16362380981445312, -0.15546226501464844, -0.14730072021484375, -0.13913917541503906, -0.13097763061523438, -0.12281608581542969, -0.114654541015625, -0.10649299621582031, -0.09833145141601562, -0.09016990661621094, -0.08200836181640625, -0.07384681701660156, -0.06568527221679688, -0.05752372741699219, -0.0493621826171875, -0.04120063781738281, -0.033039093017578125, -0.024877548217773438, -0.01671600341796875, -0.008554458618164062, -0.000392913818359375, 0.0077686309814453125, 0.01593017578125, 0.024091720581054688, 0.032253265380859375, 0.04041481018066406, 0.04857635498046875, 0.05673789978027344, 0.06489944458007812, 0.07306098937988281, 0.0812225341796875, 0.08938407897949219, 0.09754562377929688, 0.10570716857910156, 0.11386871337890625, 0.12203025817871094, 0.13019180297851562, 0.1383533477783203, 0.146514892578125, 0.1546764373779297, 0.16283798217773438, 0.17099952697753906, 0.17916107177734375, 0.18732261657714844, 0.19548416137695312, 0.2036457061767578, 0.2118072509765625, 0.2199687957763672, 0.22813034057617188, 0.23629188537597656, 0.24445343017578125, 0.25261497497558594, 0.2607765197753906, 0.2689380645751953, 0.277099609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 11.0, 9.0, 5.0, 11.0, 11.0, 21.0, 13.0, 15.0, 19.0, 24.0, 23.0, 27.0, 29.0, 34.0, 45.0, 40.0, 40.0, 34.0, 38.0, 43.0, 37.0, 34.0, 39.0, 30.0, 38.0, 45.0, 39.0, 21.0, 20.0, 19.0, 18.0, 18.0, 25.0, 18.0, 18.0, 16.0, 13.0, 13.0, 9.0, 9.0, 2.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.603515625, -0.5829391479492188, -0.5623626708984375, -0.5417861938476562, -0.521209716796875, -0.5006332397460938, -0.4800567626953125, -0.45948028564453125, -0.43890380859375, -0.41832733154296875, -0.3977508544921875, -0.37717437744140625, -0.356597900390625, -0.33602142333984375, -0.3154449462890625, -0.29486846923828125, -0.2742919921875, -0.25371551513671875, -0.2331390380859375, -0.21256256103515625, -0.191986083984375, -0.17140960693359375, -0.1508331298828125, -0.13025665283203125, -0.10968017578125, -0.08910369873046875, -0.0685272216796875, -0.04795074462890625, -0.027374267578125, -0.00679779052734375, 0.0137786865234375, 0.03435516357421875, 0.054931640625, 0.07550811767578125, 0.0960845947265625, 0.11666107177734375, 0.137237548828125, 0.15781402587890625, 0.1783905029296875, 0.19896697998046875, 0.21954345703125, 0.24011993408203125, 0.2606964111328125, 0.28127288818359375, 0.301849365234375, 0.32242584228515625, 0.3430023193359375, 0.36357879638671875, 0.3841552734375, 0.40473175048828125, 0.4253082275390625, 0.44588470458984375, 0.466461181640625, 0.48703765869140625, 0.5076141357421875, 0.5281906127929688, 0.54876708984375, 0.5693435668945312, 0.5899200439453125, 0.6104965209960938, 0.631072998046875, 0.6516494750976562, 0.6722259521484375, 0.6928024291992188, 0.71337890625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 9.0, 2.0, 8.0, 9.0, 17.0, 23.0, 19.0, 39.0, 35.0, 51.0, 103.0, 128.0, 132.0, 221.0, 329.0, 517.0, 658.0, 1021.0, 1639.0, 2299.0, 3820.0, 6066.0, 9886.0, 17074.0, 31461.0, 63414.0, 158077.0, 433866.0, 171110.0, 67629.0, 33066.0, 17783.0, 10346.0, 6304.0, 3771.0, 2508.0, 1609.0, 1074.0, 732.0, 510.0, 361.0, 260.0, 180.0, 107.0, 79.0, 70.0, 42.0, 34.0, 26.0, 10.0, 12.0, 5.0, 7.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.310791015625, -0.3006134033203125, -0.290435791015625, -0.2802581787109375, -0.27008056640625, -0.2599029541015625, -0.249725341796875, -0.2395477294921875, -0.2293701171875, -0.2191925048828125, -0.209014892578125, -0.1988372802734375, -0.18865966796875, -0.1784820556640625, -0.168304443359375, -0.1581268310546875, -0.14794921875, -0.1377716064453125, -0.127593994140625, -0.1174163818359375, -0.10723876953125, -0.0970611572265625, -0.086883544921875, -0.0767059326171875, -0.0665283203125, -0.0563507080078125, -0.046173095703125, -0.0359954833984375, -0.02581787109375, -0.0156402587890625, -0.005462646484375, 0.0047149658203125, 0.014892578125, 0.0250701904296875, 0.035247802734375, 0.0454254150390625, 0.05560302734375, 0.0657806396484375, 0.075958251953125, 0.0861358642578125, 0.0963134765625, 0.1064910888671875, 0.116668701171875, 0.1268463134765625, 0.13702392578125, 0.1472015380859375, 0.157379150390625, 0.1675567626953125, 0.177734375, 0.1879119873046875, 0.198089599609375, 0.2082672119140625, 0.21844482421875, 0.2286224365234375, 0.238800048828125, 0.2489776611328125, 0.2591552734375, 0.2693328857421875, 0.279510498046875, 0.2896881103515625, 0.29986572265625, 0.3100433349609375, 0.320220947265625, 0.3303985595703125, 0.340576171875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 11.0, 11.0, 16.0, 7.0, 15.0, 23.0, 20.0, 23.0, 26.0, 28.0, 28.0, 32.0, 33.0, 44.0, 36.0, 29.0, 41.0, 44.0, 37.0, 39.0, 47.0, 32.0, 31.0, 27.0, 33.0, 34.0, 23.0, 28.0, 26.0, 30.0, 21.0, 13.0, 16.0, 14.0, 13.0, 10.0, 6.0, 5.0, 6.0, 5.0, 5.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.363037109375, -0.34993743896484375, -0.3368377685546875, -0.32373809814453125, -0.310638427734375, -0.29753875732421875, -0.2844390869140625, -0.27133941650390625, -0.25823974609375, -0.24514007568359375, -0.2320404052734375, -0.21894073486328125, -0.205841064453125, -0.19274139404296875, -0.1796417236328125, -0.16654205322265625, -0.1534423828125, -0.14034271240234375, -0.1272430419921875, -0.11414337158203125, -0.101043701171875, -0.08794403076171875, -0.0748443603515625, -0.06174468994140625, -0.04864501953125, -0.03554534912109375, -0.0224456787109375, -0.00934600830078125, 0.003753662109375, 0.01685333251953125, 0.0299530029296875, 0.04305267333984375, 0.05615234375, 0.06925201416015625, 0.0823516845703125, 0.09545135498046875, 0.108551025390625, 0.12165069580078125, 0.1347503662109375, 0.14785003662109375, 0.16094970703125, 0.17404937744140625, 0.1871490478515625, 0.20024871826171875, 0.213348388671875, 0.22644805908203125, 0.2395477294921875, 0.25264739990234375, 0.2657470703125, 0.27884674072265625, 0.2919464111328125, 0.30504608154296875, 0.318145751953125, 0.33124542236328125, 0.3443450927734375, 0.35744476318359375, 0.37054443359375, 0.38364410400390625, 0.3967437744140625, 0.40984344482421875, 0.422943115234375, 0.43604278564453125, 0.4491424560546875, 0.46224212646484375, 0.475341796875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 10.0, 16.0, 18.0, 27.0, 43.0, 54.0, 60.0, 86.0, 127.0, 184.0, 286.0, 411.0, 574.0, 828.0, 1278.0, 2086.0, 3320.0, 5798.0, 11492.0, 26049.0, 89156.0, 721105.0, 123687.0, 31931.0, 13097.0, 6426.0, 3787.0, 2245.0, 1360.0, 930.0, 649.0, 438.0, 268.0, 211.0, 163.0, 102.0, 70.0, 55.0, 32.0, 19.0, 24.0, 15.0, 8.0, 9.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.06634521484375, -0.06417655944824219, -0.062007904052734375, -0.05983924865722656, -0.05767059326171875, -0.05550193786621094, -0.053333282470703125, -0.05116462707519531, -0.0489959716796875, -0.04682731628417969, -0.044658660888671875, -0.04249000549316406, -0.04032135009765625, -0.03815269470214844, -0.035984039306640625, -0.03381538391113281, -0.031646728515625, -0.029478073120117188, -0.027309417724609375, -0.025140762329101562, -0.02297210693359375, -0.020803451538085938, -0.018634796142578125, -0.016466140747070312, -0.0142974853515625, -0.012128829956054688, -0.009960174560546875, -0.0077915191650390625, -0.00562286376953125, -0.0034542083740234375, -0.001285552978515625, 0.0008831024169921875, 0.0030517578125, 0.0052204132080078125, 0.007389068603515625, 0.009557723999023438, 0.01172637939453125, 0.013895034790039062, 0.016063690185546875, 0.018232345581054688, 0.0204010009765625, 0.022569656372070312, 0.024738311767578125, 0.026906967163085938, 0.02907562255859375, 0.031244277954101562, 0.033412933349609375, 0.03558158874511719, 0.037750244140625, 0.03991889953613281, 0.042087554931640625, 0.04425621032714844, 0.04642486572265625, 0.04859352111816406, 0.050762176513671875, 0.05293083190917969, 0.0550994873046875, 0.05726814270019531, 0.059436798095703125, 0.06160545349121094, 0.06377410888671875, 0.06594276428222656, 0.06811141967773438, 0.07028007507324219, 0.07244873046875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 8.0, 12.0, 10.0, 27.0, 33.0, 53.0, 102.0, 207.0, 158.0, 163.0, 78.0, 39.0, 28.0, 25.0, 10.0, 8.0, 5.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.212162017822266e-06, -6.981194019317627e-06, -6.750226020812988e-06, -6.51925802230835e-06, -6.288290023803711e-06, -6.057322025299072e-06, -5.826354026794434e-06, -5.595386028289795e-06, -5.364418029785156e-06, -5.133450031280518e-06, -4.902482032775879e-06, -4.67151403427124e-06, -4.4405460357666016e-06, -4.209578037261963e-06, -3.978610038757324e-06, -3.7476420402526855e-06, -3.516674041748047e-06, -3.285706043243408e-06, -3.0547380447387695e-06, -2.823770046234131e-06, -2.592802047729492e-06, -2.3618340492248535e-06, -2.130866050720215e-06, -1.8998980522155762e-06, -1.6689300537109375e-06, -1.4379620552062988e-06, -1.2069940567016602e-06, -9.760260581970215e-07, -7.450580596923828e-07, -5.140900611877441e-07, -2.8312206268310547e-07, -5.21540641784668e-08, 1.7881393432617188e-07, 4.0978193283081055e-07, 6.407499313354492e-07, 8.717179298400879e-07, 1.1026859283447266e-06, 1.3336539268493652e-06, 1.564621925354004e-06, 1.7955899238586426e-06, 2.0265579223632812e-06, 2.25752592086792e-06, 2.4884939193725586e-06, 2.7194619178771973e-06, 2.950429916381836e-06, 3.1813979148864746e-06, 3.4123659133911133e-06, 3.643333911895752e-06, 3.874301910400391e-06, 4.105269908905029e-06, 4.336237907409668e-06, 4.567205905914307e-06, 4.798173904418945e-06, 5.029141902923584e-06, 5.260109901428223e-06, 5.491077899932861e-06, 5.7220458984375e-06, 5.953013896942139e-06, 6.183981895446777e-06, 6.414949893951416e-06, 6.645917892456055e-06, 6.876885890960693e-06, 7.107853889465332e-06, 7.338821887969971e-06, 7.569789886474609e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 5.0, 4.0, 6.0, 17.0, 28.0, 22.0, 34.0, 49.0, 71.0, 111.0, 135.0, 186.0, 301.0, 422.0, 550.0, 881.0, 1231.0, 1820.0, 2724.0, 4235.0, 6693.0, 11213.0, 21818.0, 54210.0, 431530.0, 404202.0, 53931.0, 21491.0, 11302.0, 6537.0, 4184.0, 2747.0, 1846.0, 1239.0, 833.0, 578.0, 406.0, 259.0, 214.0, 151.0, 84.0, 77.0, 61.0, 34.0, 19.0, 19.0, 17.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0799560546875, -0.07753276824951172, -0.07510948181152344, -0.07268619537353516, -0.07026290893554688, -0.0678396224975586, -0.06541633605957031, -0.06299304962158203, -0.06056976318359375, -0.05814647674560547, -0.05572319030761719, -0.053299903869628906, -0.050876617431640625, -0.048453330993652344, -0.04603004455566406, -0.04360675811767578, -0.0411834716796875, -0.03876018524169922, -0.03633689880371094, -0.033913612365722656, -0.031490325927734375, -0.029067039489746094, -0.026643753051757812, -0.02422046661376953, -0.02179718017578125, -0.01937389373779297, -0.016950607299804688, -0.014527320861816406, -0.012104034423828125, -0.009680747985839844, -0.0072574615478515625, -0.004834175109863281, -0.002410888671875, 1.239776611328125e-05, 0.0024356842041015625, 0.004858970642089844, 0.007282257080078125, 0.009705543518066406, 0.012128829956054688, 0.014552116394042969, 0.01697540283203125, 0.01939868927001953, 0.021821975708007812, 0.024245262145996094, 0.026668548583984375, 0.029091835021972656, 0.03151512145996094, 0.03393840789794922, 0.0363616943359375, 0.03878498077392578, 0.04120826721191406, 0.043631553649902344, 0.046054840087890625, 0.048478126525878906, 0.05090141296386719, 0.05332469940185547, 0.05574798583984375, 0.05817127227783203, 0.06059455871582031, 0.0630178451538086, 0.06544113159179688, 0.06786441802978516, 0.07028770446777344, 0.07271099090576172, 0.07513427734375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 8.0, 7.0, 7.0, 12.0, 15.0, 14.0, 28.0, 49.0, 70.0, 148.0, 225.0, 119.0, 80.0, 45.0, 30.0, 23.0, 16.0, 13.0, 13.0, 11.0, 6.0, 3.0, 5.0, 7.0, 7.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.01459503173828125, -0.014171481132507324, -0.013747930526733398, -0.013324379920959473, -0.012900829315185547, -0.012477278709411621, -0.012053728103637695, -0.01163017749786377, -0.011206626892089844, -0.010783076286315918, -0.010359525680541992, -0.009935975074768066, -0.00951242446899414, -0.009088873863220215, -0.008665323257446289, -0.008241772651672363, -0.007818222045898438, -0.007394671440124512, -0.006971120834350586, -0.00654757022857666, -0.006124019622802734, -0.005700469017028809, -0.005276918411254883, -0.004853367805480957, -0.004429817199707031, -0.0040062665939331055, -0.0035827159881591797, -0.003159165382385254, -0.002735614776611328, -0.0023120641708374023, -0.0018885135650634766, -0.0014649629592895508, -0.001041412353515625, -0.0006178617477416992, -0.00019431114196777344, 0.00022923946380615234, 0.0006527900695800781, 0.001076340675354004, 0.0014998912811279297, 0.0019234418869018555, 0.0023469924926757812, 0.002770543098449707, 0.003194093704223633, 0.0036176443099975586, 0.004041194915771484, 0.00446474552154541, 0.004888296127319336, 0.005311846733093262, 0.0057353973388671875, 0.006158947944641113, 0.006582498550415039, 0.007006049156188965, 0.007429599761962891, 0.007853150367736816, 0.008276700973510742, 0.008700251579284668, 0.009123802185058594, 0.00954735279083252, 0.009970903396606445, 0.010394454002380371, 0.010818004608154297, 0.011241555213928223, 0.011665105819702148, 0.012088656425476074, 0.01251220703125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 5.0, 5.0, 3.0, 6.0, 6.0, 10.0, 10.0, 10.0, 18.0, 19.0, 24.0, 23.0, 43.0, 56.0, 66.0, 87.0, 95.0, 107.0, 69.0, 75.0, 59.0, 42.0, 32.0, 34.0, 14.0, 23.0, 10.0, 11.0, 5.0, 12.0, 3.0, 4.0, 7.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9049148559570312, -0.8758485317230225, -0.8467822670936584, -0.8177159428596497, -0.7886496782302856, -0.7595833539962769, -0.7305170297622681, -0.701450765132904, -0.67238450050354, -0.6433181762695312, -0.6142519116401672, -0.5851855874061584, -0.5561193227767944, -0.5270529985427856, -0.49798670411109924, -0.46892040967941284, -0.43985408544540405, -0.41078779101371765, -0.38172149658203125, -0.35265517234802246, -0.32358890771865845, -0.29452258348464966, -0.26545628905296326, -0.23638999462127686, -0.20732370018959045, -0.17825740575790405, -0.14919111132621765, -0.12012480199337006, -0.09105850756168365, -0.06199221312999725, -0.03292590379714966, -0.003859609365463257, 0.02520674467086792, 0.05427304282784462, 0.08333934098482132, 0.11240564286708832, 0.14147193729877472, 0.17053823173046112, 0.19960454106330872, 0.22867083549499512, 0.2577371299266815, 0.2868034243583679, 0.3158697187900543, 0.3449360132217407, 0.3740023374557495, 0.4030686020851135, 0.4321349263191223, 0.4612012207508087, 0.4902675151824951, 0.5193338394165039, 0.5484001040458679, 0.5774664282798767, 0.6065326929092407, 0.6355990171432495, 0.6646653413772583, 0.6937316060066223, 0.7227978706359863, 0.7518641948699951, 0.7809304594993591, 0.8099967837333679, 0.8390630483627319, 0.8681293725967407, 0.8971956968307495, 0.9262619614601135, 0.9553282856941223]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 8.0, 7.0, 7.0, 9.0, 11.0, 20.0, 17.0, 23.0, 15.0, 23.0, 24.0, 22.0, 34.0, 38.0, 41.0, 35.0, 41.0, 41.0, 36.0, 44.0, 30.0, 45.0, 31.0, 32.0, 41.0, 46.0, 28.0, 19.0, 26.0, 30.0, 19.0, 23.0, 19.0, 11.0, 18.0, 21.0, 13.0, 12.0, 6.0, 8.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6312729120254517, -0.6111021041870117, -0.590931236743927, -0.5707604289054871, -0.5505896210670471, -0.5304187536239624, -0.5102479457855225, -0.4900771379470825, -0.4699063003063202, -0.44973546266555786, -0.4295646548271179, -0.4093938171863556, -0.38922297954559326, -0.3690521717071533, -0.348881334066391, -0.32871049642562866, -0.3085396885871887, -0.2883688509464264, -0.26819804310798645, -0.24802720546722412, -0.22785638272762299, -0.20768555998802185, -0.18751472234725952, -0.1673438996076584, -0.14717307686805725, -0.12700225412845612, -0.10683142393827438, -0.08666059374809265, -0.06648977100849152, -0.04631894826889038, -0.02614811807870865, -0.0059772878885269165, 0.014193594455718994, 0.03436442092061043, 0.05453524738550186, 0.0747060775756836, 0.09487690031528473, 0.11504772305488586, 0.1352185606956482, 0.15538938343524933, 0.17556020617485046, 0.1957310289144516, 0.21590185165405273, 0.23607268929481506, 0.2562435269355774, 0.27641433477401733, 0.29658517241477966, 0.316756010055542, 0.33692681789398193, 0.35709765553474426, 0.3772684633731842, 0.39743930101394653, 0.4176101088523865, 0.4377809464931488, 0.45795178413391113, 0.4781225919723511, 0.4982934296131134, 0.5184642672538757, 0.5386350750923157, 0.5588058829307556, 0.5789767503738403, 0.5991475582122803, 0.6193183660507202, 0.6394892334938049, 0.6596600413322449]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 11.0, 9.0, 6.0, 20.0, 27.0, 28.0, 40.0, 57.0, 81.0, 124.0, 159.0, 240.0, 317.0, 419.0, 634.0, 837.0, 1259.0, 1755.0, 2495.0, 3653.0, 5295.0, 7582.0, 11319.0, 17038.0, 25676.0, 40272.0, 65027.0, 111138.0, 203062.0, 222661.0, 125419.0, 72058.0, 43966.0, 28029.0, 18545.0, 12235.0, 8187.0, 5701.0, 3929.0, 2780.0, 1949.0, 1315.0, 963.0, 657.0, 477.0, 319.0, 224.0, 168.0, 105.0, 69.0, 64.0, 67.0, 33.0, 14.0, 17.0, 12.0, 5.0, 6.0, 7.0, 2.0, 4.0], "bins": [-1.0966796875, -1.0625152587890625, -1.028350830078125, -0.9941864013671875, -0.96002197265625, -0.9258575439453125, -0.891693115234375, -0.8575286865234375, -0.8233642578125, -0.7891998291015625, -0.755035400390625, -0.7208709716796875, -0.68670654296875, -0.6525421142578125, -0.618377685546875, -0.5842132568359375, -0.550048828125, -0.5158843994140625, -0.481719970703125, -0.4475555419921875, -0.41339111328125, -0.3792266845703125, -0.345062255859375, -0.3108978271484375, -0.2767333984375, -0.2425689697265625, -0.208404541015625, -0.1742401123046875, -0.14007568359375, -0.1059112548828125, -0.071746826171875, -0.0375823974609375, -0.00341796875, 0.0307464599609375, 0.064910888671875, 0.0990753173828125, 0.13323974609375, 0.1674041748046875, 0.201568603515625, 0.2357330322265625, 0.2698974609375, 0.3040618896484375, 0.338226318359375, 0.3723907470703125, 0.40655517578125, 0.4407196044921875, 0.474884033203125, 0.5090484619140625, 0.543212890625, 0.5773773193359375, 0.611541748046875, 0.6457061767578125, 0.67987060546875, 0.7140350341796875, 0.748199462890625, 0.7823638916015625, 0.8165283203125, 0.8506927490234375, 0.884857177734375, 0.9190216064453125, 0.95318603515625, 0.9873504638671875, 1.021514892578125, 1.0556793212890625, 1.08984375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 1.0, 10.0, 10.0, 13.0, 14.0, 19.0, 15.0, 24.0, 16.0, 16.0, 25.0, 31.0, 36.0, 38.0, 40.0, 48.0, 47.0, 40.0, 44.0, 39.0, 36.0, 35.0, 43.0, 44.0, 42.0, 29.0, 30.0, 27.0, 34.0, 16.0, 24.0, 14.0, 18.0, 13.0, 16.0, 10.0, 3.0, 7.0, 12.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6318359375, -0.6123123168945312, -0.5927886962890625, -0.5732650756835938, -0.553741455078125, -0.5342178344726562, -0.5146942138671875, -0.49517059326171875, -0.47564697265625, -0.45612335205078125, -0.4365997314453125, -0.41707611083984375, -0.397552490234375, -0.37802886962890625, -0.3585052490234375, -0.33898162841796875, -0.3194580078125, -0.29993438720703125, -0.2804107666015625, -0.26088714599609375, -0.241363525390625, -0.22183990478515625, -0.2023162841796875, -0.18279266357421875, -0.16326904296875, -0.14374542236328125, -0.1242218017578125, -0.10469818115234375, -0.085174560546875, -0.06565093994140625, -0.0461273193359375, -0.02660369873046875, -0.007080078125, 0.01244354248046875, 0.0319671630859375, 0.05149078369140625, 0.071014404296875, 0.09053802490234375, 0.1100616455078125, 0.12958526611328125, 0.14910888671875, 0.16863250732421875, 0.1881561279296875, 0.20767974853515625, 0.227203369140625, 0.24672698974609375, 0.2662506103515625, 0.28577423095703125, 0.3052978515625, 0.32482147216796875, 0.3443450927734375, 0.36386871337890625, 0.383392333984375, 0.40291595458984375, 0.4224395751953125, 0.44196319580078125, 0.46148681640625, 0.48101043701171875, 0.5005340576171875, 0.5200576782226562, 0.539581298828125, 0.5591049194335938, 0.5786285400390625, 0.5981521606445312, 0.61767578125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 7.0, 8.0, 1.0, 6.0, 16.0, 44.0, 43.0, 66.0, 108.0, 146.0, 236.0, 336.0, 611.0, 963.0, 1603.0, 2539.0, 4414.0, 7407.0, 12779.0, 23530.0, 45192.0, 91152.0, 198017.0, 335864.0, 161211.0, 76304.0, 38173.0, 20287.0, 11248.0, 6417.0, 3789.0, 2308.0, 1354.0, 880.0, 525.0, 357.0, 208.0, 154.0, 73.0, 55.0, 42.0, 23.0, 23.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.6220703125, -1.5734710693359375, -1.524871826171875, -1.4762725830078125, -1.42767333984375, -1.3790740966796875, -1.330474853515625, -1.2818756103515625, -1.2332763671875, -1.1846771240234375, -1.136077880859375, -1.0874786376953125, -1.03887939453125, -0.9902801513671875, -0.941680908203125, -0.8930816650390625, -0.844482421875, -0.7958831787109375, -0.747283935546875, -0.6986846923828125, -0.65008544921875, -0.6014862060546875, -0.552886962890625, -0.5042877197265625, -0.4556884765625, -0.4070892333984375, -0.358489990234375, -0.3098907470703125, -0.26129150390625, -0.2126922607421875, -0.164093017578125, -0.1154937744140625, -0.06689453125, -0.0182952880859375, 0.030303955078125, 0.0789031982421875, 0.12750244140625, 0.1761016845703125, 0.224700927734375, 0.2733001708984375, 0.3218994140625, 0.3704986572265625, 0.419097900390625, 0.4676971435546875, 0.51629638671875, 0.5648956298828125, 0.613494873046875, 0.6620941162109375, 0.710693359375, 0.7592926025390625, 0.807891845703125, 0.8564910888671875, 0.90509033203125, 0.9536895751953125, 1.002288818359375, 1.0508880615234375, 1.0994873046875, 1.1480865478515625, 1.196685791015625, 1.2452850341796875, 1.29388427734375, 1.3424835205078125, 1.391082763671875, 1.4396820068359375, 1.48828125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 1.0, 1.0, 4.0, 8.0, 4.0, 9.0, 11.0, 11.0, 11.0, 13.0, 11.0, 27.0, 29.0, 24.0, 27.0, 33.0, 30.0, 28.0, 36.0, 31.0, 40.0, 36.0, 48.0, 40.0, 40.0, 45.0, 40.0, 40.0, 50.0, 40.0, 37.0, 27.0, 36.0, 22.0, 21.0, 19.0, 20.0, 13.0, 12.0, 8.0, 3.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.45166015625, -0.4385643005371094, -0.42546844482421875, -0.4123725891113281, -0.3992767333984375, -0.3861808776855469, -0.37308502197265625, -0.3599891662597656, -0.346893310546875, -0.3337974548339844, -0.32070159912109375, -0.3076057434082031, -0.2945098876953125, -0.2814140319824219, -0.26831817626953125, -0.2552223205566406, -0.24212646484375, -0.22903060913085938, -0.21593475341796875, -0.20283889770507812, -0.1897430419921875, -0.17664718627929688, -0.16355133056640625, -0.15045547485351562, -0.137359619140625, -0.12426376342773438, -0.11116790771484375, -0.09807205200195312, -0.0849761962890625, -0.07188034057617188, -0.05878448486328125, -0.045688629150390625, -0.0325927734375, -0.019496917724609375, -0.00640106201171875, 0.006694793701171875, 0.0197906494140625, 0.032886505126953125, 0.04598236083984375, 0.059078216552734375, 0.072174072265625, 0.08526992797851562, 0.09836578369140625, 0.11146163940429688, 0.1245574951171875, 0.13765335083007812, 0.15074920654296875, 0.16384506225585938, 0.17694091796875, 0.19003677368164062, 0.20313262939453125, 0.21622848510742188, 0.2293243408203125, 0.24242019653320312, 0.25551605224609375, 0.2686119079589844, 0.281707763671875, 0.2948036193847656, 0.30789947509765625, 0.3209953308105469, 0.3340911865234375, 0.3471870422363281, 0.36028289794921875, 0.3733787536621094, 0.386474609375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 9.0, 6.0, 11.0, 20.0, 19.0, 29.0, 40.0, 65.0, 67.0, 112.0, 177.0, 225.0, 309.0, 477.0, 632.0, 943.0, 1413.0, 2000.0, 3293.0, 5848.0, 12386.0, 29970.0, 106806.0, 772297.0, 65596.0, 22484.0, 9780.0, 4898.0, 2776.0, 1818.0, 1205.0, 829.0, 626.0, 393.0, 300.0, 206.0, 134.0, 96.0, 73.0, 54.0, 42.0, 27.0, 20.0, 16.0, 6.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.451904296875, -0.43793487548828125, -0.4239654541015625, -0.40999603271484375, -0.396026611328125, -0.38205718994140625, -0.3680877685546875, -0.35411834716796875, -0.34014892578125, -0.32617950439453125, -0.3122100830078125, -0.29824066162109375, -0.284271240234375, -0.27030181884765625, -0.2563323974609375, -0.24236297607421875, -0.2283935546875, -0.21442413330078125, -0.2004547119140625, -0.18648529052734375, -0.172515869140625, -0.15854644775390625, -0.1445770263671875, -0.13060760498046875, -0.11663818359375, -0.10266876220703125, -0.0886993408203125, -0.07472991943359375, -0.060760498046875, -0.04679107666015625, -0.0328216552734375, -0.01885223388671875, -0.0048828125, 0.00908660888671875, 0.0230560302734375, 0.03702545166015625, 0.050994873046875, 0.06496429443359375, 0.0789337158203125, 0.09290313720703125, 0.10687255859375, 0.12084197998046875, 0.1348114013671875, 0.14878082275390625, 0.162750244140625, 0.17671966552734375, 0.1906890869140625, 0.20465850830078125, 0.2186279296875, 0.23259735107421875, 0.2465667724609375, 0.26053619384765625, 0.274505615234375, 0.28847503662109375, 0.3024444580078125, 0.31641387939453125, 0.33038330078125, 0.34435272216796875, 0.3583221435546875, 0.37229156494140625, 0.386260986328125, 0.40023040771484375, 0.4141998291015625, 0.42816925048828125, 0.442138671875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 2.0, 10.0, 4.0, 7.0, 18.0, 18.0, 24.0, 20.0, 35.0, 65.0, 93.0, 188.0, 186.0, 104.0, 57.0, 43.0, 23.0, 17.0, 13.0, 16.0, 13.0, 9.0, 8.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0251998901367188e-05, -9.842216968536377e-06, -9.432435035705566e-06, -9.022653102874756e-06, -8.612871170043945e-06, -8.203089237213135e-06, -7.793307304382324e-06, -7.383525371551514e-06, -6.973743438720703e-06, -6.563961505889893e-06, -6.154179573059082e-06, -5.7443976402282715e-06, -5.334615707397461e-06, -4.92483377456665e-06, -4.51505184173584e-06, -4.105269908905029e-06, -3.6954879760742188e-06, -3.285706043243408e-06, -2.8759241104125977e-06, -2.466142177581787e-06, -2.0563602447509766e-06, -1.646578311920166e-06, -1.2367963790893555e-06, -8.270144462585449e-07, -4.172325134277344e-07, -7.450580596923828e-09, 4.023313522338867e-07, 8.121132850646973e-07, 1.2218952178955078e-06, 1.6316771507263184e-06, 2.041459083557129e-06, 2.4512410163879395e-06, 2.86102294921875e-06, 3.2708048820495605e-06, 3.680586814880371e-06, 4.090368747711182e-06, 4.500150680541992e-06, 4.909932613372803e-06, 5.319714546203613e-06, 5.729496479034424e-06, 6.139278411865234e-06, 6.549060344696045e-06, 6.9588422775268555e-06, 7.368624210357666e-06, 7.778406143188477e-06, 8.188188076019287e-06, 8.597970008850098e-06, 9.007751941680908e-06, 9.417533874511719e-06, 9.82731580734253e-06, 1.023709774017334e-05, 1.064687967300415e-05, 1.1056661605834961e-05, 1.1466443538665771e-05, 1.1876225471496582e-05, 1.2286007404327393e-05, 1.2695789337158203e-05, 1.3105571269989014e-05, 1.3515353202819824e-05, 1.3925135135650635e-05, 1.4334917068481445e-05, 1.4744699001312256e-05, 1.5154480934143066e-05, 1.5564262866973877e-05, 1.5974044799804688e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 2.0, 4.0, 4.0, 7.0, 11.0, 24.0, 29.0, 46.0, 46.0, 72.0, 91.0, 123.0, 147.0, 230.0, 310.0, 366.0, 476.0, 656.0, 863.0, 1181.0, 1617.0, 2412.0, 3658.0, 5860.0, 10386.0, 20233.0, 44927.0, 194931.0, 642874.0, 59364.0, 24668.0, 12572.0, 6809.0, 4059.0, 2614.0, 1756.0, 1250.0, 937.0, 715.0, 560.0, 439.0, 308.0, 225.0, 171.0, 155.0, 93.0, 79.0, 54.0, 48.0, 32.0, 14.0, 19.0, 12.0, 4.0, 11.0, 3.0, 7.0, 1.0], "bins": [-0.35302734375, -0.3426856994628906, -0.33234405517578125, -0.3220024108886719, -0.3116607666015625, -0.3013191223144531, -0.29097747802734375, -0.2806358337402344, -0.270294189453125, -0.2599525451660156, -0.24961090087890625, -0.23926925659179688, -0.2289276123046875, -0.21858596801757812, -0.20824432373046875, -0.19790267944335938, -0.18756103515625, -0.17721939086914062, -0.16687774658203125, -0.15653610229492188, -0.1461944580078125, -0.13585281372070312, -0.12551116943359375, -0.11516952514648438, -0.104827880859375, -0.09448623657226562, -0.08414459228515625, -0.07380294799804688, -0.0634613037109375, -0.053119659423828125, -0.04277801513671875, -0.032436370849609375, -0.0220947265625, -0.011753082275390625, -0.00141143798828125, 0.008930206298828125, 0.0192718505859375, 0.029613494873046875, 0.03995513916015625, 0.050296783447265625, 0.060638427734375, 0.07098007202148438, 0.08132171630859375, 0.09166336059570312, 0.1020050048828125, 0.11234664916992188, 0.12268829345703125, 0.13302993774414062, 0.14337158203125, 0.15371322631835938, 0.16405487060546875, 0.17439651489257812, 0.1847381591796875, 0.19507980346679688, 0.20542144775390625, 0.21576309204101562, 0.226104736328125, 0.23644638061523438, 0.24678802490234375, 0.2571296691894531, 0.2674713134765625, 0.2778129577636719, 0.28815460205078125, 0.2984962463378906, 0.308837890625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 4.0, 9.0, 11.0, 21.0, 8.0, 23.0, 22.0, 35.0, 43.0, 86.0, 383.0, 132.0, 56.0, 43.0, 24.0, 31.0, 15.0, 9.0, 12.0, 3.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10888671875, -0.10521888732910156, -0.10155105590820312, -0.09788322448730469, -0.09421539306640625, -0.09054756164550781, -0.08687973022460938, -0.08321189880371094, -0.0795440673828125, -0.07587623596191406, -0.07220840454101562, -0.06854057312011719, -0.06487274169921875, -0.06120491027832031, -0.057537078857421875, -0.05386924743652344, -0.050201416015625, -0.04653358459472656, -0.042865753173828125, -0.03919792175292969, -0.03553009033203125, -0.03186225891113281, -0.028194427490234375, -0.024526596069335938, -0.0208587646484375, -0.017190933227539062, -0.013523101806640625, -0.009855270385742188, -0.00618743896484375, -0.0025196075439453125, 0.001148223876953125, 0.0048160552978515625, 0.00848388671875, 0.012151718139648438, 0.015819549560546875, 0.019487380981445312, 0.02315521240234375, 0.026823043823242188, 0.030490875244140625, 0.03415870666503906, 0.0378265380859375, 0.04149436950683594, 0.045162200927734375, 0.04883003234863281, 0.05249786376953125, 0.05616569519042969, 0.059833526611328125, 0.06350135803222656, 0.067169189453125, 0.07083702087402344, 0.07450485229492188, 0.07817268371582031, 0.08184051513671875, 0.08550834655761719, 0.08917617797851562, 0.09284400939941406, 0.0965118408203125, 0.10017967224121094, 0.10384750366210938, 0.10751533508300781, 0.11118316650390625, 0.11485099792480469, 0.11851882934570312, 0.12218666076660156, 0.1258544921875]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 3.0, 5.0, 7.0, 10.0, 16.0, 12.0, 14.0, 14.0, 32.0, 19.0, 38.0, 61.0, 60.0, 96.0, 108.0, 99.0, 81.0, 67.0, 51.0, 34.0, 37.0, 23.0, 27.0, 15.0, 9.0, 11.0, 5.0, 11.0, 6.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.845241367816925, -0.8161753416061401, -0.7871093153953552, -0.7580432891845703, -0.7289772629737854, -0.6999112367630005, -0.6708452701568604, -0.6417791843414307, -0.6127132177352905, -0.5836471915245056, -0.5545811653137207, -0.5255151391029358, -0.4964491128921509, -0.46738308668136597, -0.43831709027290344, -0.40925106406211853, -0.38018500804901123, -0.3511189818382263, -0.3220529556274414, -0.2929869294166565, -0.2639209032058716, -0.23485489189624786, -0.20578888058662415, -0.17672285437583923, -0.14765682816505432, -0.11859080195426941, -0.0895247831940651, -0.06045876443386078, -0.03139273822307587, -0.0023267120122909546, 0.026739299297332764, 0.055805325508117676, 0.08487141132354736, 0.11393743753433228, 0.1430034637451172, 0.1720694750547409, 0.20113550126552582, 0.23020152747631073, 0.25926753878593445, 0.28833356499671936, 0.3173995912075043, 0.3464656174182892, 0.3755316436290741, 0.4045976400375366, 0.43366366624832153, 0.46272969245910645, 0.49179571866989136, 0.5208617448806763, 0.5499277710914612, 0.5789937973022461, 0.608059823513031, 0.6371258497238159, 0.6661918759346008, 0.6952579021453857, 0.7243238687515259, 0.7533899545669556, 0.7824559211730957, 0.8115219473838806, 0.8405879735946655, 0.8696539998054504, 0.8987200260162354, 0.9277860522270203, 0.9568520784378052, 0.9859180450439453, 1.014984130859375]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 6.0, 14.0, 13.0, 13.0, 7.0, 16.0, 28.0, 26.0, 20.0, 22.0, 25.0, 36.0, 32.0, 32.0, 39.0, 42.0, 36.0, 36.0, 52.0, 48.0, 36.0, 33.0, 30.0, 37.0, 32.0, 30.0, 32.0, 29.0, 22.0, 19.0, 18.0, 29.0, 18.0, 15.0, 15.0, 12.0, 12.0, 5.0, 7.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5279859304428101, -0.5085781812667847, -0.4891703724861145, -0.4697626233100891, -0.45035484433174133, -0.43094706535339355, -0.41153931617736816, -0.3921315371990204, -0.3727237582206726, -0.35331597924232483, -0.33390820026397705, -0.31450045108795166, -0.2950926721096039, -0.2756848931312561, -0.2562771439552307, -0.23686936497688293, -0.21746158599853516, -0.19805380702018738, -0.1786460429430008, -0.1592382788658142, -0.13983049988746643, -0.12042272835969925, -0.10101495683193207, -0.08160719275474548, -0.062199413776397705, -0.042791642248630524, -0.023383870720863342, -0.003976099193096161, 0.01543167233467102, 0.0348394438624382, 0.05424721539020538, 0.07365497946739197, 0.09306275844573975, 0.11247052997350693, 0.1318783015012741, 0.1512860655784607, 0.17069384455680847, 0.19010162353515625, 0.20950938761234283, 0.22891715168952942, 0.2483249306678772, 0.267732709646225, 0.28714048862457275, 0.30654823780059814, 0.3259560167789459, 0.3453637957572937, 0.3647715449333191, 0.38417932391166687, 0.40358710289001465, 0.4229948818683624, 0.4424026608467102, 0.4618104100227356, 0.4812181890010834, 0.5006259679794312, 0.5200337171554565, 0.5394414663314819, 0.5588492751121521, 0.5782570242881775, 0.5976648330688477, 0.617072582244873, 0.6364803314208984, 0.6558881402015686, 0.675295889377594, 0.6947036981582642, 0.7141114473342896]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 5.0, 8.0, 15.0, 17.0, 25.0, 29.0, 58.0, 78.0, 142.0, 200.0, 300.0, 413.0, 658.0, 1093.0, 1544.0, 2402.0, 3973.0, 6179.0, 9912.0, 16736.0, 28603.0, 49991.0, 92973.0, 188564.0, 504712.0, 1769238.0, 966231.0, 273922.0, 123794.0, 64023.0, 35509.0, 20546.0, 12279.0, 7445.0, 4475.0, 2979.0, 1827.0, 1231.0, 768.0, 495.0, 279.0, 179.0, 153.0, 91.0, 65.0, 41.0, 28.0, 21.0, 13.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.83740234375, -0.8071975708007812, -0.7769927978515625, -0.7467880249023438, -0.716583251953125, -0.6863784790039062, -0.6561737060546875, -0.6259689331054688, -0.59576416015625, -0.5655593872070312, -0.5353546142578125, -0.5051498413085938, -0.474945068359375, -0.44474029541015625, -0.4145355224609375, -0.38433074951171875, -0.3541259765625, -0.32392120361328125, -0.2937164306640625, -0.26351165771484375, -0.233306884765625, -0.20310211181640625, -0.1728973388671875, -0.14269256591796875, -0.11248779296875, -0.08228302001953125, -0.0520782470703125, -0.02187347412109375, 0.008331298828125, 0.03853607177734375, 0.0687408447265625, 0.09894561767578125, 0.129150390625, 0.15935516357421875, 0.1895599365234375, 0.21976470947265625, 0.249969482421875, 0.28017425537109375, 0.3103790283203125, 0.34058380126953125, 0.37078857421875, 0.40099334716796875, 0.4311981201171875, 0.46140289306640625, 0.491607666015625, 0.5218124389648438, 0.5520172119140625, 0.5822219848632812, 0.6124267578125, 0.6426315307617188, 0.6728363037109375, 0.7030410766601562, 0.733245849609375, 0.7634506225585938, 0.7936553955078125, 0.8238601684570312, 0.85406494140625, 0.8842697143554688, 0.9144744873046875, 0.9446792602539062, 0.974884033203125, 1.0050888061523438, 1.0352935791015625, 1.0654983520507812, 1.095703125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 7.0, 8.0, 11.0, 12.0, 9.0, 11.0, 20.0, 24.0, 17.0, 15.0, 27.0, 25.0, 29.0, 25.0, 30.0, 40.0, 38.0, 45.0, 47.0, 46.0, 42.0, 43.0, 22.0, 32.0, 35.0, 34.0, 37.0, 25.0, 34.0, 21.0, 16.0, 20.0, 25.0, 13.0, 17.0, 17.0, 11.0, 14.0, 9.0, 9.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3232421875, -0.3119010925292969, -0.30055999755859375, -0.2892189025878906, -0.2778778076171875, -0.2665367126464844, -0.25519561767578125, -0.24385452270507812, -0.232513427734375, -0.22117233276367188, -0.20983123779296875, -0.19849014282226562, -0.1871490478515625, -0.17580795288085938, -0.16446685791015625, -0.15312576293945312, -0.14178466796875, -0.13044357299804688, -0.11910247802734375, -0.10776138305664062, -0.0964202880859375, -0.08507919311523438, -0.07373809814453125, -0.062397003173828125, -0.051055908203125, -0.039714813232421875, -0.02837371826171875, -0.017032623291015625, -0.0056915283203125, 0.005649566650390625, 0.01699066162109375, 0.028331756591796875, 0.0396728515625, 0.051013946533203125, 0.06235504150390625, 0.07369613647460938, 0.0850372314453125, 0.09637832641601562, 0.10771942138671875, 0.11906051635742188, 0.130401611328125, 0.14174270629882812, 0.15308380126953125, 0.16442489624023438, 0.1757659912109375, 0.18710708618164062, 0.19844818115234375, 0.20978927612304688, 0.22113037109375, 0.23247146606445312, 0.24381256103515625, 0.2551536560058594, 0.2664947509765625, 0.2778358459472656, 0.28917694091796875, 0.3005180358886719, 0.311859130859375, 0.3232002258300781, 0.33454132080078125, 0.3458824157714844, 0.3572235107421875, 0.3685646057128906, 0.37990570068359375, 0.3912467956542969, 0.402587890625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 15.0, 18.0, 26.0, 24.0, 50.0, 64.0, 100.0, 192.0, 330.0, 487.0, 868.0, 1298.0, 2281.0, 3780.0, 6433.0, 11241.0, 19614.0, 34917.0, 63915.0, 122671.0, 251957.0, 595600.0, 1611622.0, 821664.0, 320397.0, 151155.0, 77008.0, 41382.0, 23023.0, 13033.0, 7602.0, 4436.0, 2797.0, 1615.0, 1022.0, 617.0, 394.0, 259.0, 154.0, 82.0, 55.0, 31.0, 19.0, 14.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7705078125, -0.7453689575195312, -0.7202301025390625, -0.6950912475585938, -0.669952392578125, -0.6448135375976562, -0.6196746826171875, -0.5945358276367188, -0.56939697265625, -0.5442581176757812, -0.5191192626953125, -0.49398040771484375, -0.468841552734375, -0.44370269775390625, -0.4185638427734375, -0.39342498779296875, -0.3682861328125, -0.34314727783203125, -0.3180084228515625, -0.29286956787109375, -0.267730712890625, -0.24259185791015625, -0.2174530029296875, -0.19231414794921875, -0.16717529296875, -0.14203643798828125, -0.1168975830078125, -0.09175872802734375, -0.066619873046875, -0.04148101806640625, -0.0163421630859375, 0.00879669189453125, 0.033935546875, 0.05907440185546875, 0.0842132568359375, 0.10935211181640625, 0.134490966796875, 0.15962982177734375, 0.1847686767578125, 0.20990753173828125, 0.23504638671875, 0.26018524169921875, 0.2853240966796875, 0.31046295166015625, 0.335601806640625, 0.36074066162109375, 0.3858795166015625, 0.41101837158203125, 0.4361572265625, 0.46129608154296875, 0.4864349365234375, 0.5115737915039062, 0.536712646484375, 0.5618515014648438, 0.5869903564453125, 0.6121292114257812, 0.63726806640625, 0.6624069213867188, 0.6875457763671875, 0.7126846313476562, 0.737823486328125, 0.7629623413085938, 0.7881011962890625, 0.8132400512695312, 0.83837890625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 7.0, 2.0, 7.0, 12.0, 18.0, 13.0, 16.0, 26.0, 22.0, 40.0, 35.0, 64.0, 58.0, 82.0, 103.0, 113.0, 119.0, 160.0, 178.0, 197.0, 230.0, 270.0, 262.0, 266.0, 276.0, 225.0, 215.0, 190.0, 160.0, 138.0, 120.0, 99.0, 92.0, 58.0, 44.0, 31.0, 32.0, 16.0, 17.0, 18.0, 13.0, 13.0, 7.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.23828125, -0.231475830078125, -0.22467041015625, -0.217864990234375, -0.2110595703125, -0.204254150390625, -0.19744873046875, -0.190643310546875, -0.183837890625, -0.177032470703125, -0.17022705078125, -0.163421630859375, -0.1566162109375, -0.149810791015625, -0.14300537109375, -0.136199951171875, -0.12939453125, -0.122589111328125, -0.11578369140625, -0.108978271484375, -0.1021728515625, -0.095367431640625, -0.08856201171875, -0.081756591796875, -0.074951171875, -0.068145751953125, -0.06134033203125, -0.054534912109375, -0.0477294921875, -0.040924072265625, -0.03411865234375, -0.027313232421875, -0.0205078125, -0.013702392578125, -0.00689697265625, -9.1552734375e-05, 0.0067138671875, 0.013519287109375, 0.02032470703125, 0.027130126953125, 0.033935546875, 0.040740966796875, 0.04754638671875, 0.054351806640625, 0.0611572265625, 0.067962646484375, 0.07476806640625, 0.081573486328125, 0.08837890625, 0.095184326171875, 0.10198974609375, 0.108795166015625, 0.1156005859375, 0.122406005859375, 0.12921142578125, 0.136016845703125, 0.142822265625, 0.149627685546875, 0.15643310546875, 0.163238525390625, 0.1700439453125, 0.176849365234375, 0.18365478515625, 0.190460205078125, 0.197265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 8.0, 3.0, 7.0, 6.0, 6.0, 11.0, 16.0, 14.0, 13.0, 21.0, 28.0, 31.0, 43.0, 47.0, 68.0, 76.0, 116.0, 79.0, 65.0, 55.0, 47.0, 45.0, 25.0, 37.0, 21.0, 24.0, 7.0, 10.0, 14.0, 8.0, 6.0, 8.0, 6.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5690144300460815, -0.5512574315071106, -0.5335004925727844, -0.5157434940338135, -0.4979865550994873, -0.48022955656051636, -0.4624725878238678, -0.44471561908721924, -0.4269586503505707, -0.4092016816139221, -0.39144471287727356, -0.373687744140625, -0.35593074560165405, -0.3381738066673279, -0.32041680812835693, -0.3026598393917084, -0.2849028706550598, -0.26714590191841125, -0.2493889331817627, -0.23163194954395294, -0.21387498080730438, -0.19611801207065582, -0.17836102843284607, -0.1606040596961975, -0.14284709095954895, -0.1250901222229004, -0.10733314603567123, -0.08957616984844208, -0.07181920111179352, -0.05406223237514496, -0.0363052561879158, -0.018548280000686646, -0.0007913112640380859, 0.016965661197900772, 0.03472263365983963, 0.05247960612177849, 0.07023657858371735, 0.0879935473203659, 0.10575052350759506, 0.12350749969482422, 0.14126446843147278, 0.15902143716812134, 0.1767784059047699, 0.19453538954257965, 0.2122923582792282, 0.23004932701587677, 0.24780631065368652, 0.2655632793903351, 0.28332024812698364, 0.3010772168636322, 0.31883418560028076, 0.3365911543369293, 0.3543481230735779, 0.37210512161254883, 0.3898620903491974, 0.40761905908584595, 0.4253760278224945, 0.44313299655914307, 0.4608899652957916, 0.4786469340324402, 0.49640393257141113, 0.5141608715057373, 0.5319178700447083, 0.5496748685836792, 0.5674318075180054]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 3.0, 0.0, 9.0, 6.0, 8.0, 11.0, 13.0, 12.0, 15.0, 15.0, 15.0, 21.0, 22.0, 24.0, 27.0, 26.0, 37.0, 28.0, 40.0, 37.0, 36.0, 33.0, 39.0, 47.0, 41.0, 32.0, 36.0, 39.0, 37.0, 32.0, 30.0, 25.0, 22.0, 28.0, 20.0, 17.0, 19.0, 20.0, 9.0, 18.0, 8.0, 9.0, 5.0, 8.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.37645992636680603, -0.3636062741279602, -0.350752592086792, -0.3378989100456238, -0.32504525780677795, -0.31219160556793213, -0.2993379235267639, -0.2864842414855957, -0.2736305892467499, -0.26077693700790405, -0.24792325496673584, -0.23506958782672882, -0.2222159206867218, -0.20936225354671478, -0.19650858640670776, -0.18365491926670074, -0.17080125212669373, -0.1579475849866867, -0.1450939178466797, -0.13224025070667267, -0.11938658356666565, -0.10653291642665863, -0.09367924928665161, -0.08082558214664459, -0.06797191500663757, -0.055118247866630554, -0.042264580726623535, -0.029410913586616516, -0.016557246446609497, -0.003703579306602478, 0.009150087833404541, 0.02200375497341156, 0.03485742211341858, 0.0477110892534256, 0.06056475639343262, 0.07341842353343964, 0.08627209067344666, 0.09912575781345367, 0.1119794249534607, 0.12483309209346771, 0.13768675923347473, 0.15054042637348175, 0.16339409351348877, 0.1762477606534958, 0.1891014277935028, 0.20195509493350983, 0.21480876207351685, 0.22766242921352386, 0.24051609635353088, 0.2533697485923767, 0.2662234306335449, 0.27907711267471313, 0.29193076491355896, 0.3047844171524048, 0.317638099193573, 0.3304917812347412, 0.34334543347358704, 0.35619908571243286, 0.3690527677536011, 0.3819064497947693, 0.3947601020336151, 0.40761375427246094, 0.42046743631362915, 0.43332111835479736, 0.4461747705936432]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 10.0, 12.0, 15.0, 18.0, 21.0, 34.0, 42.0, 61.0, 98.0, 135.0, 179.0, 291.0, 373.0, 572.0, 827.0, 1127.0, 1798.0, 2612.0, 4024.0, 6260.0, 9317.0, 15079.0, 24698.0, 41702.0, 73715.0, 140205.0, 290086.0, 198136.0, 98402.0, 54032.0, 31410.0, 19148.0, 11807.0, 7461.0, 4918.0, 3213.0, 2041.0, 1442.0, 1020.0, 681.0, 464.0, 315.0, 224.0, 144.0, 117.0, 79.0, 56.0, 46.0, 23.0, 20.0, 25.0, 14.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1463623046875, -0.14175033569335938, -0.13713836669921875, -0.13252639770507812, -0.1279144287109375, -0.12330245971679688, -0.11869049072265625, -0.11407852172851562, -0.109466552734375, -0.10485458374023438, -0.10024261474609375, -0.09563064575195312, -0.0910186767578125, -0.08640670776367188, -0.08179473876953125, -0.07718276977539062, -0.07257080078125, -0.06795883178710938, -0.06334686279296875, -0.058734893798828125, -0.0541229248046875, -0.049510955810546875, -0.04489898681640625, -0.040287017822265625, -0.035675048828125, -0.031063079833984375, -0.02645111083984375, -0.021839141845703125, -0.0172271728515625, -0.012615203857421875, -0.00800323486328125, -0.003391265869140625, 0.001220703125, 0.005832672119140625, 0.01044464111328125, 0.015056610107421875, 0.0196685791015625, 0.024280548095703125, 0.02889251708984375, 0.033504486083984375, 0.038116455078125, 0.042728424072265625, 0.04734039306640625, 0.051952362060546875, 0.0565643310546875, 0.061176300048828125, 0.06578826904296875, 0.07040023803710938, 0.07501220703125, 0.07962417602539062, 0.08423614501953125, 0.08884811401367188, 0.0934600830078125, 0.09807205200195312, 0.10268402099609375, 0.10729598999023438, 0.111907958984375, 0.11651992797851562, 0.12113189697265625, 0.12574386596679688, 0.1303558349609375, 0.13496780395507812, 0.13957977294921875, 0.14419174194335938, 0.1488037109375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 5.0, 2.0, 9.0, 14.0, 7.0, 8.0, 14.0, 23.0, 15.0, 16.0, 18.0, 27.0, 28.0, 25.0, 33.0, 46.0, 39.0, 33.0, 36.0, 33.0, 50.0, 49.0, 46.0, 43.0, 44.0, 43.0, 26.0, 34.0, 27.0, 26.0, 29.0, 17.0, 17.0, 16.0, 14.0, 14.0, 17.0, 15.0, 11.0, 6.0, 3.0, 5.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.4248046875, -0.4106788635253906, -0.39655303955078125, -0.3824272155761719, -0.3683013916015625, -0.3541755676269531, -0.34004974365234375, -0.3259239196777344, -0.311798095703125, -0.2976722717285156, -0.28354644775390625, -0.2694206237792969, -0.2552947998046875, -0.24116897583007812, -0.22704315185546875, -0.21291732788085938, -0.19879150390625, -0.18466567993164062, -0.17053985595703125, -0.15641403198242188, -0.1422882080078125, -0.12816238403320312, -0.11403656005859375, -0.09991073608398438, -0.085784912109375, -0.07165908813476562, -0.05753326416015625, -0.043407440185546875, -0.0292816162109375, -0.015155792236328125, -0.00102996826171875, 0.013095855712890625, 0.0272216796875, 0.041347503662109375, 0.05547332763671875, 0.06959915161132812, 0.0837249755859375, 0.09785079956054688, 0.11197662353515625, 0.12610244750976562, 0.140228271484375, 0.15435409545898438, 0.16847991943359375, 0.18260574340820312, 0.1967315673828125, 0.21085739135742188, 0.22498321533203125, 0.23910903930664062, 0.25323486328125, 0.2673606872558594, 0.28148651123046875, 0.2956123352050781, 0.3097381591796875, 0.3238639831542969, 0.33798980712890625, 0.3521156311035156, 0.366241455078125, 0.3803672790527344, 0.39449310302734375, 0.4086189270019531, 0.4227447509765625, 0.4368705749511719, 0.45099639892578125, 0.4651222229003906, 0.479248046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 10.0, 14.0, 20.0, 24.0, 35.0, 51.0, 76.0, 118.0, 159.0, 230.0, 333.0, 497.0, 795.0, 1161.0, 1866.0, 3067.0, 5108.0, 8739.0, 15705.0, 30439.0, 68192.0, 192771.0, 460890.0, 143986.0, 55253.0, 25952.0, 13549.0, 7549.0, 4334.0, 2730.0, 1718.0, 1041.0, 725.0, 443.0, 312.0, 200.0, 137.0, 81.0, 71.0, 52.0, 41.0, 14.0, 21.0, 17.0, 8.0, 8.0, 6.0, 2.0, 4.0, 6.0, 0.0, 0.0, 2.0], "bins": [-0.252685546875, -0.2451152801513672, -0.23754501342773438, -0.22997474670410156, -0.22240447998046875, -0.21483421325683594, -0.20726394653320312, -0.1996936798095703, -0.1921234130859375, -0.1845531463623047, -0.17698287963867188, -0.16941261291503906, -0.16184234619140625, -0.15427207946777344, -0.14670181274414062, -0.1391315460205078, -0.131561279296875, -0.12399101257324219, -0.11642074584960938, -0.10885047912597656, -0.10128021240234375, -0.09370994567871094, -0.08613967895507812, -0.07856941223144531, -0.0709991455078125, -0.06342887878417969, -0.055858612060546875, -0.04828834533691406, -0.04071807861328125, -0.03314781188964844, -0.025577545166015625, -0.018007278442382812, -0.01043701171875, -0.0028667449951171875, 0.004703521728515625, 0.012273788452148438, 0.01984405517578125, 0.027414321899414062, 0.034984588623046875, 0.04255485534667969, 0.0501251220703125, 0.05769538879394531, 0.06526565551757812, 0.07283592224121094, 0.08040618896484375, 0.08797645568847656, 0.09554672241210938, 0.10311698913574219, 0.110687255859375, 0.11825752258300781, 0.12582778930664062, 0.13339805603027344, 0.14096832275390625, 0.14853858947753906, 0.15610885620117188, 0.1636791229248047, 0.1712493896484375, 0.1788196563720703, 0.18638992309570312, 0.19396018981933594, 0.20153045654296875, 0.20910072326660156, 0.21667098999023438, 0.2242412567138672, 0.2318115234375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 4.0, 0.0, 9.0, 11.0, 9.0, 8.0, 9.0, 12.0, 19.0, 20.0, 25.0, 29.0, 31.0, 36.0, 33.0, 37.0, 36.0, 42.0, 48.0, 36.0, 44.0, 55.0, 54.0, 33.0, 43.0, 44.0, 34.0, 32.0, 31.0, 15.0, 40.0, 28.0, 12.0, 16.0, 10.0, 12.0, 9.0, 6.0, 1.0, 7.0, 2.0, 5.0, 1.0, 3.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.322509765625, -0.3129310607910156, -0.30335235595703125, -0.2937736511230469, -0.2841949462890625, -0.2746162414550781, -0.26503753662109375, -0.2554588317871094, -0.245880126953125, -0.23630142211914062, -0.22672271728515625, -0.21714401245117188, -0.2075653076171875, -0.19798660278320312, -0.18840789794921875, -0.17882919311523438, -0.16925048828125, -0.15967178344726562, -0.15009307861328125, -0.14051437377929688, -0.1309356689453125, -0.12135696411132812, -0.11177825927734375, -0.10219955444335938, -0.092620849609375, -0.08304214477539062, -0.07346343994140625, -0.06388473510742188, -0.0543060302734375, -0.044727325439453125, -0.03514862060546875, -0.025569915771484375, -0.0159912109375, -0.006412506103515625, 0.00316619873046875, 0.012744903564453125, 0.0223236083984375, 0.031902313232421875, 0.04148101806640625, 0.051059722900390625, 0.060638427734375, 0.07021713256835938, 0.07979583740234375, 0.08937454223632812, 0.0989532470703125, 0.10853195190429688, 0.11811065673828125, 0.12768936157226562, 0.13726806640625, 0.14684677124023438, 0.15642547607421875, 0.16600418090820312, 0.1755828857421875, 0.18516159057617188, 0.19474029541015625, 0.20431900024414062, 0.213897705078125, 0.22347640991210938, 0.23305511474609375, 0.24263381958007812, 0.2522125244140625, 0.2617912292480469, 0.27136993408203125, 0.2809486389160156, 0.29052734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 6.0, 6.0, 16.0, 19.0, 31.0, 25.0, 41.0, 70.0, 67.0, 132.0, 176.0, 282.0, 370.0, 593.0, 959.0, 1632.0, 3036.0, 6212.0, 14611.0, 46177.0, 506444.0, 395893.0, 44223.0, 14244.0, 5935.0, 2970.0, 1619.0, 975.0, 562.0, 380.0, 241.0, 160.0, 120.0, 92.0, 59.0, 49.0, 29.0, 25.0, 15.0, 12.0, 11.0, 12.0, 6.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03607177734375, -0.034827232360839844, -0.03358268737792969, -0.03233814239501953, -0.031093597412109375, -0.02984905242919922, -0.028604507446289062, -0.027359962463378906, -0.02611541748046875, -0.024870872497558594, -0.023626327514648438, -0.02238178253173828, -0.021137237548828125, -0.01989269256591797, -0.018648147583007812, -0.017403602600097656, -0.0161590576171875, -0.014914512634277344, -0.013669967651367188, -0.012425422668457031, -0.011180877685546875, -0.009936332702636719, -0.008691787719726562, -0.007447242736816406, -0.00620269775390625, -0.004958152770996094, -0.0037136077880859375, -0.0024690628051757812, -0.001224517822265625, 2.002716064453125e-05, 0.0012645721435546875, 0.0025091171264648438, 0.003753662109375, 0.004998207092285156, 0.0062427520751953125, 0.007487297058105469, 0.008731842041015625, 0.009976387023925781, 0.011220932006835938, 0.012465476989746094, 0.01371002197265625, 0.014954566955566406, 0.016199111938476562, 0.01744365692138672, 0.018688201904296875, 0.01993274688720703, 0.021177291870117188, 0.022421836853027344, 0.0236663818359375, 0.024910926818847656, 0.026155471801757812, 0.02740001678466797, 0.028644561767578125, 0.02988910675048828, 0.031133651733398438, 0.032378196716308594, 0.03362274169921875, 0.034867286682128906, 0.03611183166503906, 0.03735637664794922, 0.038600921630859375, 0.03984546661376953, 0.04109001159667969, 0.042334556579589844, 0.0435791015625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 13.0, 14.0, 21.0, 28.0, 27.0, 61.0, 90.0, 90.0, 128.0, 60.0, 110.0, 89.0, 72.0, 63.0, 39.0, 10.0, 13.0, 17.0, 13.0, 10.0, 3.0, 7.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.3974647521972656e-06, -3.28943133354187e-06, -3.1813979148864746e-06, -3.073364496231079e-06, -2.9653310775756836e-06, -2.857297658920288e-06, -2.7492642402648926e-06, -2.641230821609497e-06, -2.5331974029541016e-06, -2.425163984298706e-06, -2.3171305656433105e-06, -2.209097146987915e-06, -2.1010637283325195e-06, -1.993030309677124e-06, -1.8849968910217285e-06, -1.776963472366333e-06, -1.6689300537109375e-06, -1.560896635055542e-06, -1.4528632164001465e-06, -1.344829797744751e-06, -1.2367963790893555e-06, -1.12876296043396e-06, -1.0207295417785645e-06, -9.126961231231689e-07, -8.046627044677734e-07, -6.966292858123779e-07, -5.885958671569824e-07, -4.805624485015869e-07, -3.725290298461914e-07, -2.644956111907959e-07, -1.564621925354004e-07, -4.842877388000488e-08, 5.960464477539063e-08, 1.6763806343078613e-07, 2.7567148208618164e-07, 3.8370490074157715e-07, 4.917383193969727e-07, 5.997717380523682e-07, 7.078051567077637e-07, 8.158385753631592e-07, 9.238719940185547e-07, 1.0319054126739502e-06, 1.1399388313293457e-06, 1.2479722499847412e-06, 1.3560056686401367e-06, 1.4640390872955322e-06, 1.5720725059509277e-06, 1.6801059246063232e-06, 1.7881393432617188e-06, 1.8961727619171143e-06, 2.0042061805725098e-06, 2.1122395992279053e-06, 2.2202730178833008e-06, 2.3283064365386963e-06, 2.436339855194092e-06, 2.5443732738494873e-06, 2.652406692504883e-06, 2.7604401111602783e-06, 2.868473529815674e-06, 2.9765069484710693e-06, 3.084540367126465e-06, 3.1925737857818604e-06, 3.300607204437256e-06, 3.4086406230926514e-06, 3.516674041748047e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 16.0, 10.0, 24.0, 30.0, 33.0, 49.0, 71.0, 80.0, 119.0, 152.0, 230.0, 297.0, 426.0, 700.0, 1154.0, 1999.0, 3676.0, 7432.0, 15991.0, 41160.0, 160762.0, 669692.0, 90410.0, 28657.0, 12086.0, 5895.0, 2859.0, 1616.0, 940.0, 572.0, 399.0, 258.0, 218.0, 147.0, 116.0, 75.0, 57.0, 39.0, 44.0, 23.0, 20.0, 13.0, 8.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.04248046875, -0.04116630554199219, -0.039852142333984375, -0.03853797912597656, -0.03722381591796875, -0.03590965270996094, -0.034595489501953125, -0.03328132629394531, -0.0319671630859375, -0.030652999877929688, -0.029338836669921875, -0.028024673461914062, -0.02671051025390625, -0.025396347045898438, -0.024082183837890625, -0.022768020629882812, -0.021453857421875, -0.020139694213867188, -0.018825531005859375, -0.017511367797851562, -0.01619720458984375, -0.014883041381835938, -0.013568878173828125, -0.012254714965820312, -0.0109405517578125, -0.009626388549804688, -0.008312225341796875, -0.0069980621337890625, -0.00568389892578125, -0.0043697357177734375, -0.003055572509765625, -0.0017414093017578125, -0.00042724609375, 0.0008869171142578125, 0.002201080322265625, 0.0035152435302734375, 0.00482940673828125, 0.0061435699462890625, 0.007457733154296875, 0.008771896362304688, 0.0100860595703125, 0.011400222778320312, 0.012714385986328125, 0.014028549194335938, 0.01534271240234375, 0.016656875610351562, 0.017971038818359375, 0.019285202026367188, 0.020599365234375, 0.021913528442382812, 0.023227691650390625, 0.024541854858398438, 0.02585601806640625, 0.027170181274414062, 0.028484344482421875, 0.029798507690429688, 0.0311126708984375, 0.03242683410644531, 0.033740997314453125, 0.03505516052246094, 0.03636932373046875, 0.03768348693847656, 0.038997650146484375, 0.04031181335449219, 0.0416259765625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 6.0, 9.0, 6.0, 14.0, 16.0, 15.0, 19.0, 23.0, 19.0, 29.0, 34.0, 48.0, 65.0, 84.0, 192.0, 107.0, 54.0, 37.0, 33.0, 35.0, 20.0, 16.0, 13.0, 13.0, 8.0, 15.0, 9.0, 5.0, 9.0, 5.0, 2.0, 8.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00855255126953125, -0.008295297622680664, -0.008038043975830078, -0.007780790328979492, -0.007523536682128906, -0.00726628303527832, -0.007009029388427734, -0.0067517757415771484, -0.0064945220947265625, -0.0062372684478759766, -0.005980014801025391, -0.005722761154174805, -0.005465507507324219, -0.005208253860473633, -0.004951000213623047, -0.004693746566772461, -0.004436492919921875, -0.004179239273071289, -0.003921985626220703, -0.003664731979370117, -0.0034074783325195312, -0.0031502246856689453, -0.0028929710388183594, -0.0026357173919677734, -0.0023784637451171875, -0.0021212100982666016, -0.0018639564514160156, -0.0016067028045654297, -0.0013494491577148438, -0.0010921955108642578, -0.0008349418640136719, -0.0005776882171630859, -0.0003204345703125, -6.318092346191406e-05, 0.00019407272338867188, 0.0004513263702392578, 0.0007085800170898438, 0.0009658336639404297, 0.0012230873107910156, 0.0014803409576416016, 0.0017375946044921875, 0.0019948482513427734, 0.0022521018981933594, 0.0025093555450439453, 0.0027666091918945312, 0.003023862838745117, 0.003281116485595703, 0.003538370132446289, 0.003795623779296875, 0.004052877426147461, 0.004310131072998047, 0.004567384719848633, 0.004824638366699219, 0.005081892013549805, 0.005339145660400391, 0.0055963993072509766, 0.0058536529541015625, 0.0061109066009521484, 0.006368160247802734, 0.00662541389465332, 0.006882667541503906, 0.007139921188354492, 0.007397174835205078, 0.007654428482055664, 0.00791168212890625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 8.0, 6.0, 4.0, 6.0, 3.0, 12.0, 14.0, 11.0, 16.0, 21.0, 26.0, 31.0, 38.0, 44.0, 63.0, 73.0, 109.0, 86.0, 77.0, 53.0, 45.0, 49.0, 35.0, 26.0, 26.0, 27.0, 10.0, 14.0, 7.0, 8.0, 10.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5731640458106995, -0.5554251074790955, -0.5376861691474915, -0.5199471712112427, -0.5022082328796387, -0.48446929454803467, -0.46673035621643066, -0.44899141788482666, -0.43125244975090027, -0.41351351141929626, -0.3957745432853699, -0.37803560495376587, -0.36029666662216187, -0.3425576984882355, -0.32481876015663147, -0.3070797920227051, -0.2893408536911011, -0.27160191535949707, -0.2538629472255707, -0.23612400889396667, -0.21838505566120148, -0.20064610242843628, -0.18290716409683228, -0.16516821086406708, -0.14742925763130188, -0.12969030439853668, -0.11195135861635208, -0.09421241283416748, -0.07647345960140228, -0.058734506368637085, -0.040995560586452484, -0.023256614804267883, -0.00551760196685791, 0.01222134754061699, 0.02996029704809189, 0.04769924655556679, 0.06543819606304169, 0.08317714929580688, 0.10091609507799149, 0.11865504086017609, 0.13639399409294128, 0.15413294732570648, 0.17187190055847168, 0.18961083889007568, 0.20734979212284088, 0.22508874535560608, 0.24282768368721008, 0.2605666518211365, 0.2783055901527405, 0.2960445284843445, 0.3137834966182709, 0.3315224349498749, 0.34926140308380127, 0.3670003414154053, 0.3847392797470093, 0.4024782180786133, 0.4202171862125397, 0.4379561245441437, 0.45569509267807007, 0.4734340310096741, 0.4911729693412781, 0.5089119672775269, 0.5266509056091309, 0.5443898439407349, 0.5621287822723389]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 2.0, 6.0, 7.0, 7.0, 11.0, 14.0, 13.0, 11.0, 17.0, 18.0, 19.0, 19.0, 28.0, 26.0, 26.0, 34.0, 30.0, 40.0, 37.0, 37.0, 33.0, 36.0, 52.0, 38.0, 32.0, 41.0, 36.0, 38.0, 31.0, 29.0, 27.0, 24.0, 24.0, 21.0, 15.0, 19.0, 19.0, 10.0, 17.0, 10.0, 9.0, 7.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3772164285182953, -0.3643534183502197, -0.35149040818214417, -0.3386273980140686, -0.32576441764831543, -0.31290140748023987, -0.3000383973121643, -0.28717538714408875, -0.2743123769760132, -0.2614493668079376, -0.24858637154102325, -0.2357233613729477, -0.22286036610603333, -0.20999735593795776, -0.1971343457698822, -0.18427133560180664, -0.17140835523605347, -0.1585453450679779, -0.14568234980106354, -0.13281933963298798, -0.11995633691549301, -0.10709333419799805, -0.09423032402992249, -0.08136732131242752, -0.06850431859493256, -0.05564131587743759, -0.04277830943465233, -0.029915302991867065, -0.0170523002743721, -0.004189297556877136, 0.008673712611198425, 0.02153671532869339, 0.03439974784851074, 0.04726275056600571, 0.06012575700879097, 0.07298876345157623, 0.0858517661690712, 0.09871476888656616, 0.11157777905464172, 0.12444078177213669, 0.13730378448963165, 0.15016679465770721, 0.16302978992462158, 0.17589280009269714, 0.1887558102607727, 0.20161880552768707, 0.21448181569576263, 0.227344810962677, 0.24020782113075256, 0.2530708312988281, 0.2659338414669037, 0.27879685163497925, 0.2916598320007324, 0.304522842168808, 0.31738585233688354, 0.3302488625049591, 0.34311187267303467, 0.35597488284111023, 0.3688378930091858, 0.38170087337493896, 0.3945638835430145, 0.4074268937110901, 0.42028990387916565, 0.4331529140472412, 0.4460158944129944]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 22.0, 25.0, 36.0, 48.0, 80.0, 117.0, 150.0, 215.0, 318.0, 466.0, 655.0, 950.0, 1393.0, 2075.0, 3019.0, 4378.0, 6578.0, 9867.0, 14997.0, 23412.0, 37933.0, 62632.0, 109285.0, 220860.0, 245802.0, 120845.0, 68180.0, 40320.0, 25321.0, 16274.0, 10628.0, 6880.0, 4694.0, 3102.0, 2213.0, 1479.0, 1053.0, 692.0, 489.0, 321.0, 238.0, 170.0, 102.0, 77.0, 48.0, 39.0, 29.0, 17.0, 12.0, 5.0, 5.0, 4.0, 0.0, 2.0], "bins": [-0.876953125, -0.8512191772460938, -0.8254852294921875, -0.7997512817382812, -0.774017333984375, -0.7482833862304688, -0.7225494384765625, -0.6968154907226562, -0.67108154296875, -0.6453475952148438, -0.6196136474609375, -0.5938796997070312, -0.568145751953125, -0.5424118041992188, -0.5166778564453125, -0.49094390869140625, -0.4652099609375, -0.43947601318359375, -0.4137420654296875, -0.38800811767578125, -0.362274169921875, -0.33654022216796875, -0.3108062744140625, -0.28507232666015625, -0.25933837890625, -0.23360443115234375, -0.2078704833984375, -0.18213653564453125, -0.156402587890625, -0.13066864013671875, -0.1049346923828125, -0.07920074462890625, -0.053466796875, -0.02773284912109375, -0.0019989013671875, 0.02373504638671875, 0.049468994140625, 0.07520294189453125, 0.1009368896484375, 0.12667083740234375, 0.15240478515625, 0.17813873291015625, 0.2038726806640625, 0.22960662841796875, 0.255340576171875, 0.28107452392578125, 0.3068084716796875, 0.33254241943359375, 0.3582763671875, 0.38401031494140625, 0.4097442626953125, 0.43547821044921875, 0.461212158203125, 0.48694610595703125, 0.5126800537109375, 0.5384140014648438, 0.56414794921875, 0.5898818969726562, 0.6156158447265625, 0.6413497924804688, 0.667083740234375, 0.6928176879882812, 0.7185516357421875, 0.7442855834960938, 0.77001953125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 6.0, 4.0, 5.0, 9.0, 10.0, 19.0, 13.0, 19.0, 18.0, 23.0, 28.0, 30.0, 35.0, 24.0, 40.0, 45.0, 40.0, 29.0, 44.0, 45.0, 53.0, 46.0, 44.0, 32.0, 38.0, 42.0, 25.0, 22.0, 35.0, 23.0, 24.0, 20.0, 15.0, 19.0, 14.0, 13.0, 9.0, 5.0, 8.0, 4.0, 5.0, 3.0, 7.0, 0.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.386474609375, -0.37319183349609375, -0.3599090576171875, -0.34662628173828125, -0.333343505859375, -0.32006072998046875, -0.3067779541015625, -0.29349517822265625, -0.28021240234375, -0.26692962646484375, -0.2536468505859375, -0.24036407470703125, -0.227081298828125, -0.21379852294921875, -0.2005157470703125, -0.18723297119140625, -0.1739501953125, -0.16066741943359375, -0.1473846435546875, -0.13410186767578125, -0.120819091796875, -0.10753631591796875, -0.0942535400390625, -0.08097076416015625, -0.06768798828125, -0.05440521240234375, -0.0411224365234375, -0.02783966064453125, -0.014556884765625, -0.00127410888671875, 0.0120086669921875, 0.02529144287109375, 0.03857421875, 0.05185699462890625, 0.0651397705078125, 0.07842254638671875, 0.091705322265625, 0.10498809814453125, 0.1182708740234375, 0.13155364990234375, 0.14483642578125, 0.15811920166015625, 0.1714019775390625, 0.18468475341796875, 0.197967529296875, 0.21125030517578125, 0.2245330810546875, 0.23781585693359375, 0.2510986328125, 0.26438140869140625, 0.2776641845703125, 0.29094696044921875, 0.304229736328125, 0.31751251220703125, 0.3307952880859375, 0.34407806396484375, 0.35736083984375, 0.37064361572265625, 0.3839263916015625, 0.39720916748046875, 0.410491943359375, 0.42377471923828125, 0.4370574951171875, 0.45034027099609375, 0.463623046875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 5.0, 9.0, 6.0, 19.0, 31.0, 38.0, 61.0, 87.0, 137.0, 187.0, 310.0, 439.0, 650.0, 1126.0, 1770.0, 2815.0, 4525.0, 7320.0, 12288.0, 20196.0, 34061.0, 58896.0, 110224.0, 245656.0, 271823.0, 120618.0, 63749.0, 36216.0, 21498.0, 12904.0, 7781.0, 4884.0, 3048.0, 1846.0, 1173.0, 765.0, 453.0, 335.0, 209.0, 132.0, 102.0, 55.0, 37.0, 24.0, 15.0, 15.0, 7.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9970703125, -0.965972900390625, -0.93487548828125, -0.903778076171875, -0.8726806640625, -0.841583251953125, -0.81048583984375, -0.779388427734375, -0.748291015625, -0.717193603515625, -0.68609619140625, -0.654998779296875, -0.6239013671875, -0.592803955078125, -0.56170654296875, -0.530609130859375, -0.49951171875, -0.468414306640625, -0.43731689453125, -0.406219482421875, -0.3751220703125, -0.344024658203125, -0.31292724609375, -0.281829833984375, -0.250732421875, -0.219635009765625, -0.18853759765625, -0.157440185546875, -0.1263427734375, -0.095245361328125, -0.06414794921875, -0.033050537109375, -0.001953125, 0.029144287109375, 0.06024169921875, 0.091339111328125, 0.1224365234375, 0.153533935546875, 0.18463134765625, 0.215728759765625, 0.246826171875, 0.277923583984375, 0.30902099609375, 0.340118408203125, 0.3712158203125, 0.402313232421875, 0.43341064453125, 0.464508056640625, 0.49560546875, 0.526702880859375, 0.55780029296875, 0.588897705078125, 0.6199951171875, 0.651092529296875, 0.68218994140625, 0.713287353515625, 0.744384765625, 0.775482177734375, 0.80657958984375, 0.837677001953125, 0.8687744140625, 0.899871826171875, 0.93096923828125, 0.962066650390625, 0.9931640625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 10.0, 12.0, 10.0, 6.0, 15.0, 12.0, 13.0, 20.0, 21.0, 31.0, 28.0, 41.0, 31.0, 36.0, 26.0, 38.0, 42.0, 45.0, 54.0, 37.0, 42.0, 46.0, 32.0, 32.0, 45.0, 36.0, 29.0, 28.0, 17.0, 22.0, 27.0, 15.0, 24.0, 21.0, 8.0, 10.0, 4.0, 5.0, 11.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272216796875, -0.26337432861328125, -0.2545318603515625, -0.24568939208984375, -0.236846923828125, -0.22800445556640625, -0.2191619873046875, -0.21031951904296875, -0.20147705078125, -0.19263458251953125, -0.1837921142578125, -0.17494964599609375, -0.166107177734375, -0.15726470947265625, -0.1484222412109375, -0.13957977294921875, -0.1307373046875, -0.12189483642578125, -0.1130523681640625, -0.10420989990234375, -0.095367431640625, -0.08652496337890625, -0.0776824951171875, -0.06884002685546875, -0.05999755859375, -0.05115509033203125, -0.0423126220703125, -0.03347015380859375, -0.024627685546875, -0.01578521728515625, -0.0069427490234375, 0.00189971923828125, 0.0107421875, 0.01958465576171875, 0.0284271240234375, 0.03726959228515625, 0.046112060546875, 0.05495452880859375, 0.0637969970703125, 0.07263946533203125, 0.08148193359375, 0.09032440185546875, 0.0991668701171875, 0.10800933837890625, 0.116851806640625, 0.12569427490234375, 0.1345367431640625, 0.14337921142578125, 0.1522216796875, 0.16106414794921875, 0.1699066162109375, 0.17874908447265625, 0.187591552734375, 0.19643402099609375, 0.2052764892578125, 0.21411895751953125, 0.22296142578125, 0.23180389404296875, 0.2406463623046875, 0.24948883056640625, 0.258331298828125, 0.26717376708984375, 0.2760162353515625, 0.28485870361328125, 0.293701171875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 11.0, 11.0, 15.0, 26.0, 32.0, 38.0, 49.0, 77.0, 97.0, 145.0, 188.0, 228.0, 323.0, 406.0, 635.0, 801.0, 1119.0, 1617.0, 2253.0, 3486.0, 5577.0, 9569.0, 18658.0, 42184.0, 214265.0, 645404.0, 50899.0, 21181.0, 10884.0, 6016.0, 3667.0, 2506.0, 1748.0, 1224.0, 850.0, 595.0, 428.0, 376.0, 247.0, 199.0, 143.0, 103.0, 82.0, 49.0, 48.0, 32.0, 16.0, 19.0, 16.0, 6.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1202392578125, -0.11649227142333984, -0.11274528503417969, -0.10899829864501953, -0.10525131225585938, -0.10150432586669922, -0.09775733947753906, -0.0940103530883789, -0.09026336669921875, -0.0865163803100586, -0.08276939392089844, -0.07902240753173828, -0.07527542114257812, -0.07152843475341797, -0.06778144836425781, -0.06403446197509766, -0.0602874755859375, -0.056540489196777344, -0.05279350280761719, -0.04904651641845703, -0.045299530029296875, -0.04155254364013672, -0.03780555725097656, -0.034058570861816406, -0.03031158447265625, -0.026564598083496094, -0.022817611694335938, -0.01907062530517578, -0.015323638916015625, -0.011576652526855469, -0.007829666137695312, -0.004082679748535156, -0.000335693359375, 0.0034112930297851562, 0.0071582794189453125, 0.010905265808105469, 0.014652252197265625, 0.01839923858642578, 0.022146224975585938, 0.025893211364746094, 0.02964019775390625, 0.033387184143066406, 0.03713417053222656, 0.04088115692138672, 0.044628143310546875, 0.04837512969970703, 0.05212211608886719, 0.055869102478027344, 0.0596160888671875, 0.06336307525634766, 0.06711006164550781, 0.07085704803466797, 0.07460403442382812, 0.07835102081298828, 0.08209800720214844, 0.0858449935913086, 0.08959197998046875, 0.0933389663696289, 0.09708595275878906, 0.10083293914794922, 0.10457992553710938, 0.10832691192626953, 0.11207389831542969, 0.11582088470458984, 0.11956787109375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 14.0, 22.0, 31.0, 39.0, 137.0, 276.0, 252.0, 90.0, 54.0, 26.0, 17.0, 11.0, 8.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0669231414794922e-05, -1.0387971997261047e-05, -1.0106712579727173e-05, -9.825453162193298e-06, -9.544193744659424e-06, -9.26293432712555e-06, -8.981674909591675e-06, -8.7004154920578e-06, -8.419156074523926e-06, -8.137896656990051e-06, -7.856637239456177e-06, -7.575377821922302e-06, -7.294118404388428e-06, -7.012858986854553e-06, -6.731599569320679e-06, -6.450340151786804e-06, -6.16908073425293e-06, -5.887821316719055e-06, -5.606561899185181e-06, -5.325302481651306e-06, -5.044043064117432e-06, -4.762783646583557e-06, -4.481524229049683e-06, -4.200264811515808e-06, -3.919005393981934e-06, -3.637745976448059e-06, -3.3564865589141846e-06, -3.07522714138031e-06, -2.7939677238464355e-06, -2.512708306312561e-06, -2.2314488887786865e-06, -1.950189471244812e-06, -1.6689300537109375e-06, -1.387670636177063e-06, -1.1064112186431885e-06, -8.25151801109314e-07, -5.438923835754395e-07, -2.6263296604156494e-07, 1.862645149230957e-08, 2.998858690261841e-07, 5.811452865600586e-07, 8.624047040939331e-07, 1.1436641216278076e-06, 1.4249235391616821e-06, 1.7061829566955566e-06, 1.987442374229431e-06, 2.2687017917633057e-06, 2.54996120929718e-06, 2.8312206268310547e-06, 3.112480044364929e-06, 3.3937394618988037e-06, 3.6749988794326782e-06, 3.956258296966553e-06, 4.237517714500427e-06, 4.518777132034302e-06, 4.800036549568176e-06, 5.081295967102051e-06, 5.362555384635925e-06, 5.6438148021698e-06, 5.925074219703674e-06, 6.206333637237549e-06, 6.487593054771423e-06, 6.768852472305298e-06, 7.050111889839172e-06, 7.331371307373047e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 8.0, 6.0, 10.0, 9.0, 14.0, 12.0, 15.0, 28.0, 44.0, 63.0, 67.0, 89.0, 133.0, 177.0, 228.0, 250.0, 386.0, 516.0, 639.0, 797.0, 1204.0, 1558.0, 2209.0, 3085.0, 4919.0, 8420.0, 16500.0, 40988.0, 664970.0, 225981.0, 36138.0, 15347.0, 7916.0, 4662.0, 3068.0, 2125.0, 1504.0, 1121.0, 819.0, 626.0, 445.0, 331.0, 280.0, 213.0, 174.0, 124.0, 86.0, 62.0, 45.0, 52.0, 31.0, 18.0, 13.0, 11.0, 9.0, 11.0, 9.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.169189453125, -0.1638927459716797, -0.15859603881835938, -0.15329933166503906, -0.14800262451171875, -0.14270591735839844, -0.13740921020507812, -0.1321125030517578, -0.1268157958984375, -0.12151908874511719, -0.11622238159179688, -0.11092567443847656, -0.10562896728515625, -0.10033226013183594, -0.09503555297851562, -0.08973884582519531, -0.084442138671875, -0.07914543151855469, -0.07384872436523438, -0.06855201721191406, -0.06325531005859375, -0.05795860290527344, -0.052661895751953125, -0.04736518859863281, -0.0420684814453125, -0.03677177429199219, -0.031475067138671875, -0.026178359985351562, -0.02088165283203125, -0.015584945678710938, -0.010288238525390625, -0.0049915313720703125, 0.00030517578125, 0.0056018829345703125, 0.010898590087890625, 0.016195297241210938, 0.02149200439453125, 0.026788711547851562, 0.032085418701171875, 0.03738212585449219, 0.0426788330078125, 0.04797554016113281, 0.053272247314453125, 0.05856895446777344, 0.06386566162109375, 0.06916236877441406, 0.07445907592773438, 0.07975578308105469, 0.085052490234375, 0.09034919738769531, 0.09564590454101562, 0.10094261169433594, 0.10623931884765625, 0.11153602600097656, 0.11683273315429688, 0.12212944030761719, 0.1274261474609375, 0.1327228546142578, 0.13801956176757812, 0.14331626892089844, 0.14861297607421875, 0.15390968322753906, 0.15920639038085938, 0.1645030975341797, 0.1697998046875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 7.0, 7.0, 7.0, 5.0, 16.0, 21.0, 34.0, 59.0, 308.0, 308.0, 61.0, 29.0, 33.0, 27.0, 12.0, 13.0, 9.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.055816650390625, -0.054071903228759766, -0.05232715606689453, -0.0505824089050293, -0.04883766174316406, -0.04709291458129883, -0.045348167419433594, -0.04360342025756836, -0.041858673095703125, -0.04011392593383789, -0.038369178771972656, -0.03662443161010742, -0.03487968444824219, -0.03313493728637695, -0.03139019012451172, -0.029645442962646484, -0.02790069580078125, -0.026155948638916016, -0.02441120147705078, -0.022666454315185547, -0.020921707153320312, -0.019176959991455078, -0.017432212829589844, -0.01568746566772461, -0.013942718505859375, -0.01219797134399414, -0.010453224182128906, -0.008708477020263672, -0.0069637298583984375, -0.005218982696533203, -0.0034742355346679688, -0.0017294883728027344, 1.52587890625e-05, 0.0017600059509277344, 0.0035047531127929688, 0.005249500274658203, 0.0069942474365234375, 0.008738994598388672, 0.010483741760253906, 0.01222848892211914, 0.013973236083984375, 0.01571798324584961, 0.017462730407714844, 0.019207477569580078, 0.020952224731445312, 0.022696971893310547, 0.02444171905517578, 0.026186466217041016, 0.02793121337890625, 0.029675960540771484, 0.03142070770263672, 0.03316545486450195, 0.03491020202636719, 0.03665494918823242, 0.038399696350097656, 0.04014444351196289, 0.041889190673828125, 0.04363393783569336, 0.045378684997558594, 0.04712343215942383, 0.04886817932128906, 0.0506129264831543, 0.05235767364501953, 0.054102420806884766, 0.05584716796875]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 0.0, 3.0, 5.0, 11.0, 4.0, 6.0, 11.0, 10.0, 10.0, 13.0, 15.0, 18.0, 39.0, 44.0, 70.0, 72.0, 88.0, 124.0, 91.0, 67.0, 51.0, 39.0, 51.0, 42.0, 18.0, 18.0, 19.0, 11.0, 6.0, 6.0, 9.0, 3.0, 6.0, 3.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.7507361769676208, -0.7308685779571533, -0.7110009789466858, -0.6911333203315735, -0.671265721321106, -0.6513981223106384, -0.6315305233001709, -0.6116629242897034, -0.5917953252792358, -0.5719277262687683, -0.5520601272583008, -0.5321924686431885, -0.512324869632721, -0.4924572706222534, -0.4725896716117859, -0.45272207260131836, -0.43285441398620605, -0.4129868149757385, -0.3931191861629486, -0.3732515871524811, -0.35338395833969116, -0.33351635932922363, -0.3136487603187561, -0.2937811613082886, -0.27391353249549866, -0.25404593348503113, -0.2341783046722412, -0.21431070566177368, -0.19444309175014496, -0.17457547783851624, -0.1547078788280487, -0.13484026491641998, -0.11497271060943604, -0.09510509669780731, -0.07523749023675919, -0.05536988005042076, -0.035502269864082336, -0.015634655952453613, 0.004232950508594513, 0.02410055696964264, 0.04396817088127136, 0.06383578479290009, 0.08370339125394821, 0.10357099771499634, 0.12343861162662506, 0.14330622553825378, 0.1631738245487213, 0.18304143846035004, 0.20290905237197876, 0.22277666628360748, 0.2426442801952362, 0.26251187920570374, 0.28237950801849365, 0.3022471070289612, 0.3221147060394287, 0.34198230504989624, 0.36184993386268616, 0.3817175328731537, 0.4015851616859436, 0.42145276069641113, 0.44132035970687866, 0.4611879885196686, 0.4810555875301361, 0.500923216342926, 0.5207908153533936]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 7.0, 8.0, 11.0, 8.0, 9.0, 15.0, 28.0, 16.0, 17.0, 20.0, 17.0, 33.0, 46.0, 38.0, 37.0, 31.0, 51.0, 34.0, 47.0, 39.0, 38.0, 41.0, 43.0, 39.0, 38.0, 43.0, 31.0, 18.0, 25.0, 24.0, 21.0, 24.0, 14.0, 16.0, 11.0, 11.0, 7.0, 11.0, 3.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.44486716389656067, -0.43124186992645264, -0.417616605758667, -0.40399131178855896, -0.3903660476207733, -0.3767407536506653, -0.36311548948287964, -0.3494901955127716, -0.3358649015426636, -0.32223960757255554, -0.3086143434047699, -0.29498904943466187, -0.2813637852668762, -0.2677384912967682, -0.25411319732666016, -0.2404879331588745, -0.22686266899108887, -0.21323738992214203, -0.1996121108531952, -0.18598681688308716, -0.1723615527153015, -0.15873625874519348, -0.14511097967624664, -0.1314857006072998, -0.11786042153835297, -0.10423514246940613, -0.09060986340045929, -0.07698457688093185, -0.06335929781198502, -0.04973401874303818, -0.03610873222351074, -0.022483453154563904, -0.008858174085617065, 0.004767106845974922, 0.01839238777756691, 0.03201767057180405, 0.045642949640750885, 0.05926822870969772, 0.07289351522922516, 0.086518794298172, 0.10014407336711884, 0.11376935243606567, 0.1273946315050125, 0.14101991057395935, 0.15464520454406738, 0.16827046871185303, 0.18189576268196106, 0.1955210417509079, 0.20914632081985474, 0.22277159988880157, 0.2363968789577484, 0.25002217292785645, 0.2636474370956421, 0.2772727310657501, 0.29089802503585815, 0.3045232892036438, 0.31814855337142944, 0.3317738473415375, 0.3453991115093231, 0.35902440547943115, 0.3726496696472168, 0.38627496361732483, 0.39990025758743286, 0.4135255217552185, 0.42715081572532654]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 9.0, 3.0, 11.0, 10.0, 12.0, 25.0, 35.0, 62.0, 110.0, 172.0, 272.0, 533.0, 845.0, 1560.0, 2547.0, 4601.0, 8070.0, 15130.0, 28854.0, 60252.0, 138751.0, 429920.0, 2122439.0, 978998.0, 223167.0, 87065.0, 41469.0, 21416.0, 12056.0, 6675.0, 3877.0, 2179.0, 1374.0, 717.0, 420.0, 246.0, 161.0, 69.0, 44.0, 39.0, 41.0, 18.0, 18.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76025390625, -0.7338027954101562, -0.7073516845703125, -0.6809005737304688, -0.654449462890625, -0.6279983520507812, -0.6015472412109375, -0.5750961303710938, -0.54864501953125, -0.5221939086914062, -0.4957427978515625, -0.46929168701171875, -0.442840576171875, -0.41638946533203125, -0.3899383544921875, -0.36348724365234375, -0.3370361328125, -0.31058502197265625, -0.2841339111328125, -0.25768280029296875, -0.231231689453125, -0.20478057861328125, -0.1783294677734375, -0.15187835693359375, -0.12542724609375, -0.09897613525390625, -0.0725250244140625, -0.04607391357421875, -0.019622802734375, 0.00682830810546875, 0.0332794189453125, 0.05973052978515625, 0.086181640625, 0.11263275146484375, 0.1390838623046875, 0.16553497314453125, 0.191986083984375, 0.21843719482421875, 0.2448883056640625, 0.27133941650390625, 0.29779052734375, 0.32424163818359375, 0.3506927490234375, 0.37714385986328125, 0.403594970703125, 0.43004608154296875, 0.4564971923828125, 0.48294830322265625, 0.5093994140625, 0.5358505249023438, 0.5623016357421875, 0.5887527465820312, 0.615203857421875, 0.6416549682617188, 0.6681060791015625, 0.6945571899414062, 0.72100830078125, 0.7474594116210938, 0.7739105224609375, 0.8003616333007812, 0.826812744140625, 0.8532638549804688, 0.8797149658203125, 0.9061660766601562, 0.9326171875]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 3.0, 8.0, 7.0, 11.0, 22.0, 16.0, 18.0, 16.0, 20.0, 14.0, 21.0, 40.0, 37.0, 40.0, 25.0, 45.0, 43.0, 55.0, 28.0, 39.0, 41.0, 31.0, 35.0, 55.0, 30.0, 32.0, 29.0, 26.0, 19.0, 25.0, 23.0, 21.0, 13.0, 15.0, 10.0, 13.0, 12.0, 14.0, 5.0, 6.0, 9.0, 5.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.24755859375, -0.23968887329101562, -0.23181915283203125, -0.22394943237304688, -0.2160797119140625, -0.20820999145507812, -0.20034027099609375, -0.19247055053710938, -0.184600830078125, -0.17673110961914062, -0.16886138916015625, -0.16099166870117188, -0.1531219482421875, -0.14525222778320312, -0.13738250732421875, -0.12951278686523438, -0.12164306640625, -0.11377334594726562, -0.10590362548828125, -0.09803390502929688, -0.0901641845703125, -0.08229446411132812, -0.07442474365234375, -0.06655502319335938, -0.058685302734375, -0.050815582275390625, -0.04294586181640625, -0.035076141357421875, -0.0272064208984375, -0.019336700439453125, -0.01146697998046875, -0.003597259521484375, 0.0042724609375, 0.012142181396484375, 0.02001190185546875, 0.027881622314453125, 0.0357513427734375, 0.043621063232421875, 0.05149078369140625, 0.059360504150390625, 0.067230224609375, 0.07509994506835938, 0.08296966552734375, 0.09083938598632812, 0.0987091064453125, 0.10657882690429688, 0.11444854736328125, 0.12231826782226562, 0.13018798828125, 0.13805770874023438, 0.14592742919921875, 0.15379714965820312, 0.1616668701171875, 0.16953659057617188, 0.17740631103515625, 0.18527603149414062, 0.193145751953125, 0.20101547241210938, 0.20888519287109375, 0.21675491333007812, 0.2246246337890625, 0.23249435424804688, 0.24036407470703125, 0.24823379516601562, 0.256103515625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 17.0, 24.0, 34.0, 47.0, 66.0, 106.0, 148.0, 215.0, 361.0, 511.0, 787.0, 1187.0, 1940.0, 3049.0, 4979.0, 8211.0, 14166.0, 24557.0, 44936.0, 85211.0, 170368.0, 376385.0, 1066334.0, 1478174.0, 479975.0, 208037.0, 101431.0, 52806.0, 28890.0, 16494.0, 9547.0, 5666.0, 3475.0, 2168.0, 1411.0, 877.0, 559.0, 373.0, 244.0, 166.0, 111.0, 82.0, 56.0, 29.0, 28.0, 14.0, 7.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.52783203125, -0.5114059448242188, -0.4949798583984375, -0.47855377197265625, -0.462127685546875, -0.44570159912109375, -0.4292755126953125, -0.41284942626953125, -0.39642333984375, -0.37999725341796875, -0.3635711669921875, -0.34714508056640625, -0.330718994140625, -0.31429290771484375, -0.2978668212890625, -0.28144073486328125, -0.2650146484375, -0.24858856201171875, -0.2321624755859375, -0.21573638916015625, -0.199310302734375, -0.18288421630859375, -0.1664581298828125, -0.15003204345703125, -0.13360595703125, -0.11717987060546875, -0.1007537841796875, -0.08432769775390625, -0.067901611328125, -0.05147552490234375, -0.0350494384765625, -0.01862335205078125, -0.002197265625, 0.01422882080078125, 0.0306549072265625, 0.04708099365234375, 0.063507080078125, 0.07993316650390625, 0.0963592529296875, 0.11278533935546875, 0.12921142578125, 0.14563751220703125, 0.1620635986328125, 0.17848968505859375, 0.194915771484375, 0.21134185791015625, 0.2277679443359375, 0.24419403076171875, 0.2606201171875, 0.27704620361328125, 0.2934722900390625, 0.30989837646484375, 0.326324462890625, 0.34275054931640625, 0.3591766357421875, 0.37560272216796875, 0.39202880859375, 0.40845489501953125, 0.4248809814453125, 0.44130706787109375, 0.457733154296875, 0.47415924072265625, 0.4905853271484375, 0.5070114135742188, 0.5234375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 13.0, 5.0, 15.0, 18.0, 31.0, 29.0, 37.0, 39.0, 60.0, 71.0, 87.0, 105.0, 110.0, 136.0, 188.0, 199.0, 246.0, 266.0, 284.0, 313.0, 285.0, 219.0, 227.0, 207.0, 149.0, 131.0, 118.0, 91.0, 87.0, 69.0, 58.0, 33.0, 26.0, 34.0, 14.0, 11.0, 12.0, 8.0, 8.0, 12.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1591796875, -0.15453338623046875, -0.1498870849609375, -0.14524078369140625, -0.140594482421875, -0.13594818115234375, -0.1313018798828125, -0.12665557861328125, -0.12200927734375, -0.11736297607421875, -0.1127166748046875, -0.10807037353515625, -0.103424072265625, -0.09877777099609375, -0.0941314697265625, -0.08948516845703125, -0.0848388671875, -0.08019256591796875, -0.0755462646484375, -0.07089996337890625, -0.066253662109375, -0.06160736083984375, -0.0569610595703125, -0.05231475830078125, -0.04766845703125, -0.04302215576171875, -0.0383758544921875, -0.03372955322265625, -0.029083251953125, -0.02443695068359375, -0.0197906494140625, -0.01514434814453125, -0.010498046875, -0.00585174560546875, -0.0012054443359375, 0.00344085693359375, 0.008087158203125, 0.01273345947265625, 0.0173797607421875, 0.02202606201171875, 0.02667236328125, 0.03131866455078125, 0.0359649658203125, 0.04061126708984375, 0.045257568359375, 0.04990386962890625, 0.0545501708984375, 0.05919647216796875, 0.0638427734375, 0.06848907470703125, 0.0731353759765625, 0.07778167724609375, 0.082427978515625, 0.08707427978515625, 0.0917205810546875, 0.09636688232421875, 0.10101318359375, 0.10565948486328125, 0.1103057861328125, 0.11495208740234375, 0.119598388671875, 0.12424468994140625, 0.1288909912109375, 0.13353729248046875, 0.13818359375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 5.0, 6.0, 7.0, 14.0, 13.0, 20.0, 18.0, 24.0, 34.0, 51.0, 79.0, 93.0, 88.0, 102.0, 87.0, 80.0, 45.0, 53.0, 44.0, 23.0, 20.0, 16.0, 15.0, 17.0, 6.0, 4.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.5478900671005249, -0.5339280366897583, -0.5199660062789917, -0.5060039758682251, -0.4920419454574585, -0.4780799150466919, -0.4641178846359253, -0.4501558542251587, -0.4361938238143921, -0.4222317934036255, -0.4082697629928589, -0.3943077325820923, -0.3803457021713257, -0.3663836717605591, -0.3524216413497925, -0.3384596109390259, -0.3244975805282593, -0.3105355501174927, -0.2965735197067261, -0.2826114892959595, -0.26864945888519287, -0.25468742847442627, -0.24072539806365967, -0.22676336765289307, -0.21280130743980408, -0.19883927702903748, -0.18487724661827087, -0.17091521620750427, -0.15695318579673767, -0.14299115538597107, -0.12902912497520447, -0.11506708711385727, -0.10110506415367126, -0.08714303374290466, -0.07318100333213806, -0.05921896919608116, -0.04525693878531456, -0.03129490464925766, -0.01733287423849106, -0.003370843827724457, 0.010591186583042145, 0.024553216993808746, 0.03851524740457535, 0.05247728154063225, 0.06643931567668915, 0.08040134608745575, 0.09436337649822235, 0.10832540690898895, 0.12228743731975555, 0.13624946773052216, 0.15021149814128876, 0.16417352855205536, 0.17813555896282196, 0.19209760427474976, 0.20605963468551636, 0.22002166509628296, 0.23398369550704956, 0.24794572591781616, 0.26190775632858276, 0.27586978673934937, 0.28983181715011597, 0.30379384756088257, 0.31775587797164917, 0.33171790838241577, 0.3456799387931824]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 10.0, 8.0, 9.0, 16.0, 6.0, 21.0, 21.0, 18.0, 27.0, 17.0, 33.0, 38.0, 35.0, 34.0, 36.0, 35.0, 43.0, 44.0, 43.0, 34.0, 43.0, 40.0, 31.0, 54.0, 32.0, 35.0, 37.0, 29.0, 19.0, 17.0, 25.0, 28.0, 8.0, 12.0, 15.0, 7.0, 8.0, 8.0, 7.0, 5.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3041698634624481, -0.29492777585983276, -0.2856857180595398, -0.27644363045692444, -0.2672015428543091, -0.2579594850540161, -0.24871739745140076, -0.2394753247499466, -0.23023325204849243, -0.22099117934703827, -0.2117490917444229, -0.20250701904296875, -0.1932649463415146, -0.18402287364006042, -0.17478078603744507, -0.1655387133359909, -0.15629662573337555, -0.1470545530319214, -0.13781246542930603, -0.12857039272785187, -0.1193283200263977, -0.11008623987436295, -0.10084415972232819, -0.09160208702087402, -0.08236000686883926, -0.0731179267168045, -0.06387585401535034, -0.05463377386331558, -0.04539169743657112, -0.03614962100982666, -0.0269075408577919, -0.017665468156337738, -0.008423388004302979, 0.0008186893537640572, 0.010060766711831093, 0.019302845001220703, 0.028544921427965164, 0.037786997854709625, 0.047029078006744385, 0.05627115070819855, 0.0655132308602333, 0.07475531101226807, 0.08399738371372223, 0.09323946386575699, 0.10248154401779175, 0.11172361671924591, 0.12096569687128067, 0.13020777702331543, 0.1394498497247696, 0.14869192242622375, 0.1579340100288391, 0.16717608273029327, 0.17641815543174744, 0.1856602430343628, 0.19490231573581696, 0.20414438843727112, 0.21338647603988647, 0.22262854874134064, 0.231870636343956, 0.24111270904541016, 0.2503547966480255, 0.2595968544483185, 0.26883894205093384, 0.2780809998512268, 0.28732308745384216]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 6.0, 13.0, 12.0, 22.0, 28.0, 49.0, 61.0, 94.0, 105.0, 198.0, 269.0, 420.0, 609.0, 892.0, 1278.0, 1960.0, 2940.0, 4677.0, 7182.0, 11251.0, 18644.0, 31712.0, 57142.0, 112021.0, 264630.0, 274545.0, 115315.0, 58495.0, 32069.0, 19191.0, 11618.0, 7377.0, 4680.0, 2969.0, 1908.0, 1320.0, 931.0, 571.0, 413.0, 315.0, 224.0, 125.0, 86.0, 62.0, 45.0, 30.0, 14.0, 14.0, 13.0, 9.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.099609375, -0.09649848937988281, -0.09338760375976562, -0.09027671813964844, -0.08716583251953125, -0.08405494689941406, -0.08094406127929688, -0.07783317565917969, -0.0747222900390625, -0.07161140441894531, -0.06850051879882812, -0.06538963317871094, -0.06227874755859375, -0.05916786193847656, -0.056056976318359375, -0.05294609069824219, -0.049835205078125, -0.04672431945800781, -0.043613433837890625, -0.04050254821777344, -0.03739166259765625, -0.03428077697753906, -0.031169891357421875, -0.028059005737304688, -0.0249481201171875, -0.021837234497070312, -0.018726348876953125, -0.015615463256835938, -0.01250457763671875, -0.009393692016601562, -0.006282806396484375, -0.0031719207763671875, -6.103515625e-05, 0.0030498504638671875, 0.006160736083984375, 0.009271621704101562, 0.01238250732421875, 0.015493392944335938, 0.018604278564453125, 0.021715164184570312, 0.0248260498046875, 0.027936935424804688, 0.031047821044921875, 0.03415870666503906, 0.03726959228515625, 0.04038047790527344, 0.043491363525390625, 0.04660224914550781, 0.049713134765625, 0.05282402038574219, 0.055934906005859375, 0.05904579162597656, 0.06215667724609375, 0.06526756286621094, 0.06837844848632812, 0.07148933410644531, 0.0746002197265625, 0.07771110534667969, 0.08082199096679688, 0.08393287658691406, 0.08704376220703125, 0.09015464782714844, 0.09326553344726562, 0.09637641906738281, 0.0994873046875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 6.0, 10.0, 6.0, 14.0, 18.0, 16.0, 10.0, 22.0, 18.0, 24.0, 26.0, 31.0, 38.0, 26.0, 35.0, 37.0, 35.0, 45.0, 53.0, 38.0, 45.0, 29.0, 39.0, 34.0, 43.0, 32.0, 24.0, 37.0, 24.0, 33.0, 23.0, 18.0, 11.0, 26.0, 12.0, 7.0, 9.0, 8.0, 8.0, 5.0, 6.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30615234375, -0.29705047607421875, -0.2879486083984375, -0.27884674072265625, -0.269744873046875, -0.26064300537109375, -0.2515411376953125, -0.24243927001953125, -0.23333740234375, -0.22423553466796875, -0.2151336669921875, -0.20603179931640625, -0.196929931640625, -0.18782806396484375, -0.1787261962890625, -0.16962432861328125, -0.1605224609375, -0.15142059326171875, -0.1423187255859375, -0.13321685791015625, -0.124114990234375, -0.11501312255859375, -0.1059112548828125, -0.09680938720703125, -0.08770751953125, -0.07860565185546875, -0.0695037841796875, -0.06040191650390625, -0.051300048828125, -0.04219818115234375, -0.0330963134765625, -0.02399444580078125, -0.014892578125, -0.00579071044921875, 0.0033111572265625, 0.01241302490234375, 0.021514892578125, 0.03061676025390625, 0.0397186279296875, 0.04882049560546875, 0.05792236328125, 0.06702423095703125, 0.0761260986328125, 0.08522796630859375, 0.094329833984375, 0.10343170166015625, 0.1125335693359375, 0.12163543701171875, 0.1307373046875, 0.13983917236328125, 0.1489410400390625, 0.15804290771484375, 0.167144775390625, 0.17624664306640625, 0.1853485107421875, 0.19445037841796875, 0.20355224609375, 0.21265411376953125, 0.2217559814453125, 0.23085784912109375, 0.239959716796875, 0.24906158447265625, 0.2581634521484375, 0.26726531982421875, 0.2763671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 0.0, 1.0, 5.0, 7.0, 14.0, 17.0, 13.0, 17.0, 24.0, 39.0, 65.0, 80.0, 108.0, 189.0, 255.0, 387.0, 608.0, 937.0, 1499.0, 2457.0, 4319.0, 7700.0, 15128.0, 32050.0, 77594.0, 254539.0, 445467.0, 117105.0, 44325.0, 20024.0, 9993.0, 5404.0, 3127.0, 1790.0, 1105.0, 697.0, 452.0, 327.0, 179.0, 144.0, 122.0, 63.0, 53.0, 35.0, 25.0, 21.0, 16.0, 7.0, 8.0, 6.0, 7.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.19091796875, -0.18549346923828125, -0.1800689697265625, -0.17464447021484375, -0.169219970703125, -0.16379547119140625, -0.1583709716796875, -0.15294647216796875, -0.14752197265625, -0.14209747314453125, -0.1366729736328125, -0.13124847412109375, -0.125823974609375, -0.12039947509765625, -0.1149749755859375, -0.10955047607421875, -0.1041259765625, -0.09870147705078125, -0.0932769775390625, -0.08785247802734375, -0.082427978515625, -0.07700347900390625, -0.0715789794921875, -0.06615447998046875, -0.06072998046875, -0.05530548095703125, -0.0498809814453125, -0.04445648193359375, -0.039031982421875, -0.03360748291015625, -0.0281829833984375, -0.02275848388671875, -0.017333984375, -0.01190948486328125, -0.0064849853515625, -0.00106048583984375, 0.004364013671875, 0.00978851318359375, 0.0152130126953125, 0.02063751220703125, 0.02606201171875, 0.03148651123046875, 0.0369110107421875, 0.04233551025390625, 0.047760009765625, 0.05318450927734375, 0.0586090087890625, 0.06403350830078125, 0.0694580078125, 0.07488250732421875, 0.0803070068359375, 0.08573150634765625, 0.091156005859375, 0.09658050537109375, 0.1020050048828125, 0.10742950439453125, 0.11285400390625, 0.11827850341796875, 0.1237030029296875, 0.12912750244140625, 0.134552001953125, 0.13997650146484375, 0.1454010009765625, 0.15082550048828125, 0.15625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 10.0, 6.0, 8.0, 9.0, 11.0, 13.0, 14.0, 13.0, 20.0, 26.0, 25.0, 27.0, 26.0, 26.0, 32.0, 50.0, 36.0, 36.0, 45.0, 43.0, 40.0, 41.0, 40.0, 37.0, 33.0, 36.0, 27.0, 27.0, 36.0, 24.0, 31.0, 29.0, 17.0, 18.0, 14.0, 15.0, 7.0, 13.0, 6.0, 7.0, 6.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1676025390625, -0.16168785095214844, -0.15577316284179688, -0.1498584747314453, -0.14394378662109375, -0.1380290985107422, -0.13211441040039062, -0.12619972229003906, -0.1202850341796875, -0.11437034606933594, -0.10845565795898438, -0.10254096984863281, -0.09662628173828125, -0.09071159362792969, -0.08479690551757812, -0.07888221740722656, -0.072967529296875, -0.06705284118652344, -0.061138153076171875, -0.05522346496582031, -0.04930877685546875, -0.04339408874511719, -0.037479400634765625, -0.03156471252441406, -0.0256500244140625, -0.019735336303710938, -0.013820648193359375, -0.007905960083007812, -0.00199127197265625, 0.0039234161376953125, 0.009838104248046875, 0.015752792358398438, 0.02166748046875, 0.027582168579101562, 0.033496856689453125, 0.03941154479980469, 0.04532623291015625, 0.05124092102050781, 0.057155609130859375, 0.06307029724121094, 0.0689849853515625, 0.07489967346191406, 0.08081436157226562, 0.08672904968261719, 0.09264373779296875, 0.09855842590332031, 0.10447311401367188, 0.11038780212402344, 0.116302490234375, 0.12221717834472656, 0.12813186645507812, 0.1340465545654297, 0.13996124267578125, 0.1458759307861328, 0.15179061889648438, 0.15770530700683594, 0.1636199951171875, 0.16953468322753906, 0.17544937133789062, 0.1813640594482422, 0.18727874755859375, 0.1931934356689453, 0.19910812377929688, 0.20502281188964844, 0.2109375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 12.0, 15.0, 21.0, 23.0, 36.0, 49.0, 55.0, 105.0, 159.0, 225.0, 402.0, 735.0, 1268.0, 2509.0, 4788.0, 10539.0, 25142.0, 75688.0, 583008.0, 255106.0, 52646.0, 19139.0, 8247.0, 3900.0, 1991.0, 1086.0, 654.0, 361.0, 234.0, 143.0, 84.0, 54.0, 39.0, 20.0, 11.0, 13.0, 9.0, 6.0, 9.0, 3.0, 0.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.015625, -0.015064001083374023, -0.014503002166748047, -0.01394200325012207, -0.013381004333496094, -0.012820005416870117, -0.01225900650024414, -0.011698007583618164, -0.011137008666992188, -0.010576009750366211, -0.010015010833740234, -0.009454011917114258, -0.008893013000488281, -0.008332014083862305, -0.007771015167236328, -0.0072100162506103516, -0.006649017333984375, -0.0060880184173583984, -0.005527019500732422, -0.004966020584106445, -0.004405021667480469, -0.003844022750854492, -0.0032830238342285156, -0.002722024917602539, -0.0021610260009765625, -0.001600027084350586, -0.0010390281677246094, -0.0004780292510986328, 8.296966552734375e-05, 0.0006439685821533203, 0.0012049674987792969, 0.0017659664154052734, 0.00232696533203125, 0.0028879642486572266, 0.003448963165283203, 0.00400996208190918, 0.004570960998535156, 0.005131959915161133, 0.005692958831787109, 0.006253957748413086, 0.0068149566650390625, 0.007375955581665039, 0.007936954498291016, 0.008497953414916992, 0.009058952331542969, 0.009619951248168945, 0.010180950164794922, 0.010741949081420898, 0.011302947998046875, 0.011863946914672852, 0.012424945831298828, 0.012985944747924805, 0.013546943664550781, 0.014107942581176758, 0.014668941497802734, 0.015229940414428711, 0.015790939331054688, 0.016351938247680664, 0.01691293716430664, 0.017473936080932617, 0.018034934997558594, 0.01859593391418457, 0.019156932830810547, 0.019717931747436523, 0.0202789306640625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 14.0, 0.0, 4.0, 20.0, 19.0, 0.0, 23.0, 35.0, 0.0, 58.0, 71.0, 75.0, 0.0, 76.0, 90.0, 0.0, 69.0, 88.0, 75.0, 0.0, 45.0, 64.0, 46.0, 0.0, 26.0, 35.0, 0.0, 19.0, 16.0, 9.0, 0.0, 7.0, 5.0, 0.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3280659914016724e-06, -1.2852251529693604e-06, -1.2423843145370483e-06, -1.1995434761047363e-06, -1.1567026376724243e-06, -1.1138617992401123e-06, -1.0710209608078003e-06, -1.0281801223754883e-06, -9.853392839431763e-07, -9.424984455108643e-07, -8.996576070785522e-07, -8.568167686462402e-07, -8.139759302139282e-07, -7.711350917816162e-07, -7.282942533493042e-07, -6.854534149169922e-07, -6.426125764846802e-07, -5.997717380523682e-07, -5.569308996200562e-07, -5.140900611877441e-07, -4.7124922275543213e-07, -4.284083843231201e-07, -3.855675458908081e-07, -3.427267074584961e-07, -2.998858690261841e-07, -2.5704503059387207e-07, -2.1420419216156006e-07, -1.7136335372924805e-07, -1.2852251529693604e-07, -8.568167686462402e-08, -4.284083843231201e-08, 0.0, 4.284083843231201e-08, 8.568167686462402e-08, 1.2852251529693604e-07, 1.7136335372924805e-07, 2.1420419216156006e-07, 2.5704503059387207e-07, 2.998858690261841e-07, 3.427267074584961e-07, 3.855675458908081e-07, 4.284083843231201e-07, 4.7124922275543213e-07, 5.140900611877441e-07, 5.569308996200562e-07, 5.997717380523682e-07, 6.426125764846802e-07, 6.854534149169922e-07, 7.282942533493042e-07, 7.711350917816162e-07, 8.139759302139282e-07, 8.568167686462402e-07, 8.996576070785522e-07, 9.424984455108643e-07, 9.853392839431763e-07, 1.0281801223754883e-06, 1.0710209608078003e-06, 1.1138617992401123e-06, 1.1567026376724243e-06, 1.1995434761047363e-06, 1.2423843145370483e-06, 1.2852251529693604e-06, 1.3280659914016724e-06, 1.3709068298339844e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 3.0, 7.0, 15.0, 19.0, 27.0, 44.0, 60.0, 85.0, 115.0, 170.0, 278.0, 413.0, 679.0, 1213.0, 1931.0, 3313.0, 5928.0, 11505.0, 22691.0, 50341.0, 138546.0, 524259.0, 173156.0, 59022.0, 25999.0, 12747.0, 6761.0, 3733.0, 2137.0, 1203.0, 774.0, 445.0, 312.0, 207.0, 145.0, 78.0, 51.0, 35.0, 30.0, 24.0, 11.0, 12.0, 9.0, 4.0, 3.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0173187255859375, -0.016787290573120117, -0.016255855560302734, -0.01572442054748535, -0.015192985534667969, -0.014661550521850586, -0.014130115509033203, -0.01359868049621582, -0.013067245483398438, -0.012535810470581055, -0.012004375457763672, -0.011472940444946289, -0.010941505432128906, -0.010410070419311523, -0.00987863540649414, -0.009347200393676758, -0.008815765380859375, -0.008284330368041992, -0.007752895355224609, -0.0072214603424072266, -0.006690025329589844, -0.006158590316772461, -0.005627155303955078, -0.005095720291137695, -0.0045642852783203125, -0.00403285026550293, -0.003501415252685547, -0.002969980239868164, -0.0024385452270507812, -0.0019071102142333984, -0.0013756752014160156, -0.0008442401885986328, -0.00031280517578125, 0.0002186298370361328, 0.0007500648498535156, 0.0012814998626708984, 0.0018129348754882812, 0.002344369888305664, 0.002875804901123047, 0.0034072399139404297, 0.0039386749267578125, 0.004470109939575195, 0.005001544952392578, 0.005532979965209961, 0.006064414978027344, 0.0065958499908447266, 0.007127285003662109, 0.007658720016479492, 0.008190155029296875, 0.008721590042114258, 0.00925302505493164, 0.009784460067749023, 0.010315895080566406, 0.010847330093383789, 0.011378765106201172, 0.011910200119018555, 0.012441635131835938, 0.01297307014465332, 0.013504505157470703, 0.014035940170288086, 0.014567375183105469, 0.015098810195922852, 0.015630245208740234, 0.016161680221557617, 0.016693115234375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 6.0, 4.0, 9.0, 8.0, 8.0, 17.0, 9.0, 31.0, 21.0, 28.0, 46.0, 41.0, 53.0, 76.0, 71.0, 100.0, 93.0, 66.0, 61.0, 52.0, 25.0, 27.0, 24.0, 12.0, 19.0, 13.0, 16.0, 12.0, 11.0, 10.0, 2.0, 6.0, 4.0, 2.0, 2.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.004383087158203125, -0.004263818264007568, -0.004144549369812012, -0.004025280475616455, -0.0039060115814208984, -0.003786742687225342, -0.003667473793029785, -0.0035482048988342285, -0.003428936004638672, -0.0033096671104431152, -0.0031903982162475586, -0.003071129322052002, -0.0029518604278564453, -0.0028325915336608887, -0.002713322639465332, -0.0025940537452697754, -0.0024747848510742188, -0.002355515956878662, -0.0022362470626831055, -0.002116978168487549, -0.001997709274291992, -0.0018784403800964355, -0.001759171485900879, -0.0016399025917053223, -0.0015206336975097656, -0.001401364803314209, -0.0012820959091186523, -0.0011628270149230957, -0.001043558120727539, -0.0009242892265319824, -0.0008050203323364258, -0.0006857514381408691, -0.0005664825439453125, -0.00044721364974975586, -0.0003279447555541992, -0.00020867586135864258, -8.940696716308594e-05, 2.9861927032470703e-05, 0.00014913082122802734, 0.000268399715423584, 0.0003876686096191406, 0.0005069375038146973, 0.0006262063980102539, 0.0007454752922058105, 0.0008647441864013672, 0.0009840130805969238, 0.0011032819747924805, 0.0012225508689880371, 0.0013418197631835938, 0.0014610886573791504, 0.001580357551574707, 0.0016996264457702637, 0.0018188953399658203, 0.001938164234161377, 0.0020574331283569336, 0.0021767020225524902, 0.002295970916748047, 0.0024152398109436035, 0.00253450870513916, 0.002653777599334717, 0.0027730464935302734, 0.00289231538772583, 0.0030115842819213867, 0.0031308531761169434, 0.0032501220703125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 5.0, 4.0, 6.0, 6.0, 7.0, 7.0, 18.0, 16.0, 13.0, 21.0, 34.0, 33.0, 72.0, 83.0, 93.0, 93.0, 103.0, 77.0, 61.0, 54.0, 46.0, 34.0, 25.0, 15.0, 14.0, 23.0, 7.0, 4.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.5413714647293091, -0.5274186730384827, -0.5134658217430115, -0.49951300024986267, -0.48556017875671387, -0.47160735726356506, -0.45765453577041626, -0.44370174407958984, -0.42974889278411865, -0.41579607129096985, -0.40184324979782104, -0.38789042830467224, -0.37393760681152344, -0.35998478531837463, -0.34603196382522583, -0.3320791721343994, -0.3181263506412506, -0.3041735291481018, -0.290220707654953, -0.2762678861618042, -0.2623150646686554, -0.2483622431755066, -0.23440943658351898, -0.22045661509037018, -0.20650379359722137, -0.19255097210407257, -0.17859815061092377, -0.16464534401893616, -0.15069252252578735, -0.13673970103263855, -0.12278687953948975, -0.10883405804634094, -0.09488126635551453, -0.08092844486236572, -0.06697562336921692, -0.05302280932664871, -0.03906998783349991, -0.025117166340351105, -0.011164352297782898, 0.0027884691953659058, 0.01674129068851471, 0.030694110319018364, 0.04464692994952202, 0.058599747717380524, 0.07255256921052933, 0.08650539070367813, 0.10045820474624634, 0.11441102623939514, 0.12836384773254395, 0.14231666922569275, 0.15626949071884155, 0.17022231221199036, 0.18417513370513916, 0.19812795519828796, 0.21208076179027557, 0.22603358328342438, 0.23998640477657318, 0.2539392113685608, 0.2678920328617096, 0.2818448543548584, 0.2957976758480072, 0.309750497341156, 0.3237033188343048, 0.3376561403274536, 0.3516089618206024]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 10.0, 10.0, 8.0, 14.0, 7.0, 21.0, 22.0, 19.0, 27.0, 18.0, 33.0, 35.0, 39.0, 30.0, 35.0, 38.0, 41.0, 45.0, 48.0, 30.0, 47.0, 36.0, 34.0, 51.0, 30.0, 36.0, 38.0, 26.0, 22.0, 15.0, 26.0, 26.0, 9.0, 11.0, 15.0, 8.0, 7.0, 8.0, 7.0, 6.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30411532521247864, -0.29490023851394653, -0.28568515181541443, -0.2764700651168823, -0.26725494861602783, -0.2580398619174957, -0.24882477521896362, -0.23960968852043152, -0.23039460182189941, -0.2211795151233673, -0.2119644284248352, -0.2027493268251419, -0.1935342401266098, -0.1843191534280777, -0.1751040518283844, -0.1658889651298523, -0.1566738784313202, -0.14745879173278809, -0.13824370503425598, -0.12902860343456268, -0.11981351673603058, -0.11059843003749847, -0.10138333588838577, -0.09216824173927307, -0.08295315504074097, -0.07373806834220886, -0.06452297419309616, -0.05530788376927376, -0.046092793345451355, -0.03687770292162895, -0.02766261249780655, -0.018447518348693848, -0.009232431650161743, -1.734122633934021e-05, 0.009197749197483063, 0.018412839621305466, 0.02762793004512787, 0.03684302046895027, 0.046058110892772675, 0.055273205041885376, 0.06448829174041748, 0.07370337843894958, 0.08291847258806229, 0.09213356673717499, 0.10134865343570709, 0.1105637401342392, 0.1197788342833519, 0.1289939284324646, 0.1382090151309967, 0.1474241018295288, 0.1566391885280609, 0.1658542901277542, 0.17506937682628632, 0.18428446352481842, 0.19349956512451172, 0.20271465182304382, 0.21192973852157593, 0.22114482522010803, 0.23035991191864014, 0.23957501351833344, 0.24879010021686554, 0.25800520181655884, 0.26722028851509094, 0.27643537521362305, 0.28565046191215515]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 17.0, 10.0, 32.0, 38.0, 59.0, 67.0, 104.0, 162.0, 265.0, 362.0, 570.0, 826.0, 1131.0, 1782.0, 2466.0, 3688.0, 5532.0, 8153.0, 12459.0, 19449.0, 31114.0, 50595.0, 88002.0, 168950.0, 284346.0, 154373.0, 82195.0, 47919.0, 29340.0, 18652.0, 11901.0, 7871.0, 5188.0, 3387.0, 2458.0, 1611.0, 1062.0, 700.0, 514.0, 391.0, 255.0, 184.0, 124.0, 86.0, 45.0, 40.0, 26.0, 15.0, 12.0, 7.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.556640625, -0.5394821166992188, -0.5223236083984375, -0.5051651000976562, -0.488006591796875, -0.47084808349609375, -0.4536895751953125, -0.43653106689453125, -0.41937255859375, -0.40221405029296875, -0.3850555419921875, -0.36789703369140625, -0.350738525390625, -0.33358001708984375, -0.3164215087890625, -0.29926300048828125, -0.2821044921875, -0.26494598388671875, -0.2477874755859375, -0.23062896728515625, -0.213470458984375, -0.19631195068359375, -0.1791534423828125, -0.16199493408203125, -0.14483642578125, -0.12767791748046875, -0.1105194091796875, -0.09336090087890625, -0.076202392578125, -0.05904388427734375, -0.0418853759765625, -0.02472686767578125, -0.007568359375, 0.00959014892578125, 0.0267486572265625, 0.04390716552734375, 0.061065673828125, 0.07822418212890625, 0.0953826904296875, 0.11254119873046875, 0.12969970703125, 0.14685821533203125, 0.1640167236328125, 0.18117523193359375, 0.198333740234375, 0.21549224853515625, 0.2326507568359375, 0.24980926513671875, 0.2669677734375, 0.28412628173828125, 0.3012847900390625, 0.31844329833984375, 0.335601806640625, 0.35276031494140625, 0.3699188232421875, 0.38707733154296875, 0.40423583984375, 0.42139434814453125, 0.4385528564453125, 0.45571136474609375, 0.472869873046875, 0.49002838134765625, 0.5071868896484375, 0.5243453979492188, 0.54150390625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 8.0, 3.0, 6.0, 12.0, 15.0, 9.0, 20.0, 20.0, 29.0, 29.0, 32.0, 37.0, 35.0, 20.0, 36.0, 37.0, 39.0, 55.0, 59.0, 38.0, 30.0, 44.0, 38.0, 44.0, 39.0, 34.0, 45.0, 27.0, 21.0, 21.0, 12.0, 17.0, 14.0, 14.0, 11.0, 10.0, 8.0, 8.0, 5.0, 10.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2763671875, -0.2677421569824219, -0.25911712646484375, -0.2504920959472656, -0.2418670654296875, -0.23324203491210938, -0.22461700439453125, -0.21599197387695312, -0.207366943359375, -0.19874191284179688, -0.19011688232421875, -0.18149185180664062, -0.1728668212890625, -0.16424179077148438, -0.15561676025390625, -0.14699172973632812, -0.13836669921875, -0.12974166870117188, -0.12111663818359375, -0.11249160766601562, -0.1038665771484375, -0.09524154663085938, -0.08661651611328125, -0.07799148559570312, -0.069366455078125, -0.060741424560546875, -0.05211639404296875, -0.043491363525390625, -0.0348663330078125, -0.026241302490234375, -0.01761627197265625, -0.008991241455078125, -0.0003662109375, 0.008258819580078125, 0.01688385009765625, 0.025508880615234375, 0.0341339111328125, 0.042758941650390625, 0.05138397216796875, 0.060009002685546875, 0.068634033203125, 0.07725906372070312, 0.08588409423828125, 0.09450912475585938, 0.1031341552734375, 0.11175918579101562, 0.12038421630859375, 0.12900924682617188, 0.13763427734375, 0.14625930786132812, 0.15488433837890625, 0.16350936889648438, 0.1721343994140625, 0.18075942993164062, 0.18938446044921875, 0.19800949096679688, 0.206634521484375, 0.21525955200195312, 0.22388458251953125, 0.23250961303710938, 0.2411346435546875, 0.24975967407226562, 0.25838470458984375, 0.2670097351074219, 0.275634765625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 7.0, 7.0, 5.0, 18.0, 22.0, 42.0, 55.0, 93.0, 131.0, 229.0, 347.0, 536.0, 877.0, 1369.0, 2319.0, 3831.0, 6358.0, 10856.0, 19183.0, 34194.0, 63034.0, 122905.0, 271583.0, 256524.0, 116751.0, 59794.0, 32768.0, 18369.0, 10644.0, 6099.0, 3755.0, 2222.0, 1351.0, 836.0, 539.0, 314.0, 216.0, 138.0, 92.0, 53.0, 29.0, 21.0, 13.0, 10.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6416015625, -0.620880126953125, -0.60015869140625, -0.579437255859375, -0.5587158203125, -0.537994384765625, -0.51727294921875, -0.496551513671875, -0.475830078125, -0.455108642578125, -0.43438720703125, -0.413665771484375, -0.3929443359375, -0.372222900390625, -0.35150146484375, -0.330780029296875, -0.31005859375, -0.289337158203125, -0.26861572265625, -0.247894287109375, -0.2271728515625, -0.206451416015625, -0.18572998046875, -0.165008544921875, -0.144287109375, -0.123565673828125, -0.10284423828125, -0.082122802734375, -0.0614013671875, -0.040679931640625, -0.01995849609375, 0.000762939453125, 0.021484375, 0.042205810546875, 0.06292724609375, 0.083648681640625, 0.1043701171875, 0.125091552734375, 0.14581298828125, 0.166534423828125, 0.187255859375, 0.207977294921875, 0.22869873046875, 0.249420166015625, 0.2701416015625, 0.290863037109375, 0.31158447265625, 0.332305908203125, 0.35302734375, 0.373748779296875, 0.39447021484375, 0.415191650390625, 0.4359130859375, 0.456634521484375, 0.47735595703125, 0.498077392578125, 0.518798828125, 0.539520263671875, 0.56024169921875, 0.580963134765625, 0.6016845703125, 0.622406005859375, 0.64312744140625, 0.663848876953125, 0.6845703125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 10.0, 10.0, 4.0, 14.0, 8.0, 9.0, 19.0, 24.0, 25.0, 34.0, 27.0, 33.0, 30.0, 30.0, 38.0, 32.0, 40.0, 48.0, 45.0, 45.0, 40.0, 42.0, 42.0, 41.0, 41.0, 46.0, 33.0, 24.0, 23.0, 23.0, 19.0, 25.0, 22.0, 17.0, 12.0, 6.0, 4.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1710205078125, -0.1653900146484375, -0.159759521484375, -0.1541290283203125, -0.14849853515625, -0.1428680419921875, -0.137237548828125, -0.1316070556640625, -0.1259765625, -0.1203460693359375, -0.114715576171875, -0.1090850830078125, -0.10345458984375, -0.0978240966796875, -0.092193603515625, -0.0865631103515625, -0.0809326171875, -0.0753021240234375, -0.069671630859375, -0.0640411376953125, -0.05841064453125, -0.0527801513671875, -0.047149658203125, -0.0415191650390625, -0.035888671875, -0.0302581787109375, -0.024627685546875, -0.0189971923828125, -0.01336669921875, -0.0077362060546875, -0.002105712890625, 0.0035247802734375, 0.0091552734375, 0.0147857666015625, 0.020416259765625, 0.0260467529296875, 0.03167724609375, 0.0373077392578125, 0.042938232421875, 0.0485687255859375, 0.05419921875, 0.0598297119140625, 0.065460205078125, 0.0710906982421875, 0.07672119140625, 0.0823516845703125, 0.087982177734375, 0.0936126708984375, 0.0992431640625, 0.1048736572265625, 0.110504150390625, 0.1161346435546875, 0.12176513671875, 0.1273956298828125, 0.133026123046875, 0.1386566162109375, 0.144287109375, 0.1499176025390625, 0.155548095703125, 0.1611785888671875, 0.16680908203125, 0.1724395751953125, 0.178070068359375, 0.1837005615234375, 0.1893310546875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 12.0, 12.0, 10.0, 13.0, 20.0, 21.0, 22.0, 36.0, 50.0, 53.0, 65.0, 82.0, 106.0, 153.0, 186.0, 236.0, 329.0, 398.0, 518.0, 680.0, 882.0, 1199.0, 1767.0, 2593.0, 4108.0, 7427.0, 17146.0, 81842.0, 859752.0, 38953.0, 11997.0, 5975.0, 3509.0, 2248.0, 1582.0, 1036.0, 848.0, 615.0, 486.0, 343.0, 290.0, 200.0, 178.0, 138.0, 93.0, 83.0, 62.0, 54.0, 37.0, 35.0, 22.0, 19.0, 14.0, 11.0, 8.0, 6.0, 2.0, 5.0, 2.0, 3.0], "bins": [-0.08673095703125, -0.08404731750488281, -0.08136367797851562, -0.07868003845214844, -0.07599639892578125, -0.07331275939941406, -0.07062911987304688, -0.06794548034667969, -0.0652618408203125, -0.06257820129394531, -0.059894561767578125, -0.05721092224121094, -0.05452728271484375, -0.05184364318847656, -0.049160003662109375, -0.04647636413574219, -0.043792724609375, -0.04110908508300781, -0.038425445556640625, -0.03574180603027344, -0.03305816650390625, -0.030374526977539062, -0.027690887451171875, -0.025007247924804688, -0.0223236083984375, -0.019639968872070312, -0.016956329345703125, -0.014272689819335938, -0.01158905029296875, -0.008905410766601562, -0.006221771240234375, -0.0035381317138671875, -0.0008544921875, 0.0018291473388671875, 0.004512786865234375, 0.0071964263916015625, 0.00988006591796875, 0.012563705444335938, 0.015247344970703125, 0.017930984497070312, 0.0206146240234375, 0.023298263549804688, 0.025981903076171875, 0.028665542602539062, 0.03134918212890625, 0.03403282165527344, 0.036716461181640625, 0.03940010070800781, 0.042083740234375, 0.04476737976074219, 0.047451019287109375, 0.05013465881347656, 0.05281829833984375, 0.05550193786621094, 0.058185577392578125, 0.06086921691894531, 0.0635528564453125, 0.06623649597167969, 0.06892013549804688, 0.07160377502441406, 0.07428741455078125, 0.07697105407714844, 0.07965469360351562, 0.08233833312988281, 0.08502197265625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 11.0, 10.0, 13.0, 34.0, 58.0, 160.0, 274.0, 240.0, 96.0, 23.0, 33.0, 21.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125999450683594e-06, -4.949048161506653e-06, -4.772096872329712e-06, -4.595145583152771e-06, -4.41819429397583e-06, -4.241243004798889e-06, -4.064291715621948e-06, -3.887340426445007e-06, -3.7103891372680664e-06, -3.5334378480911255e-06, -3.3564865589141846e-06, -3.1795352697372437e-06, -3.0025839805603027e-06, -2.825632691383362e-06, -2.648681402206421e-06, -2.47173011302948e-06, -2.294778823852539e-06, -2.117827534675598e-06, -1.9408762454986572e-06, -1.7639249563217163e-06, -1.5869736671447754e-06, -1.4100223779678345e-06, -1.2330710887908936e-06, -1.0561197996139526e-06, -8.791685104370117e-07, -7.022172212600708e-07, -5.252659320831299e-07, -3.4831464290618896e-07, -1.7136335372924805e-07, 5.587935447692871e-09, 1.825392246246338e-07, 3.594905138015747e-07, 5.364418029785156e-07, 7.133930921554565e-07, 8.903443813323975e-07, 1.0672956705093384e-06, 1.2442469596862793e-06, 1.4211982488632202e-06, 1.5981495380401611e-06, 1.775100827217102e-06, 1.952052116394043e-06, 2.129003405570984e-06, 2.305954694747925e-06, 2.4829059839248657e-06, 2.6598572731018066e-06, 2.8368085622787476e-06, 3.0137598514556885e-06, 3.1907111406326294e-06, 3.3676624298095703e-06, 3.5446137189865112e-06, 3.721565008163452e-06, 3.898516297340393e-06, 4.075467586517334e-06, 4.252418875694275e-06, 4.429370164871216e-06, 4.606321454048157e-06, 4.783272743225098e-06, 4.9602240324020386e-06, 5.1371753215789795e-06, 5.31412661075592e-06, 5.491077899932861e-06, 5.668029189109802e-06, 5.844980478286743e-06, 6.021931767463684e-06, 6.198883056640625e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 7.0, 8.0, 7.0, 12.0, 16.0, 28.0, 30.0, 45.0, 62.0, 100.0, 132.0, 181.0, 263.0, 360.0, 536.0, 769.0, 1054.0, 1722.0, 2895.0, 5791.0, 13930.0, 45509.0, 869539.0, 71187.0, 18033.0, 7108.0, 3416.0, 1833.0, 1170.0, 813.0, 590.0, 406.0, 272.0, 213.0, 142.0, 107.0, 63.0, 63.0, 44.0, 22.0, 22.0, 19.0, 7.0, 10.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.10498046875, -0.10185813903808594, -0.09873580932617188, -0.09561347961425781, -0.09249114990234375, -0.08936882019042969, -0.08624649047851562, -0.08312416076660156, -0.0800018310546875, -0.07687950134277344, -0.07375717163085938, -0.07063484191894531, -0.06751251220703125, -0.06439018249511719, -0.061267852783203125, -0.05814552307128906, -0.055023193359375, -0.05190086364746094, -0.048778533935546875, -0.04565620422363281, -0.04253387451171875, -0.03941154479980469, -0.036289215087890625, -0.03316688537597656, -0.0300445556640625, -0.026922225952148438, -0.023799896240234375, -0.020677566528320312, -0.01755523681640625, -0.014432907104492188, -0.011310577392578125, -0.008188247680664062, -0.00506591796875, -0.0019435882568359375, 0.001178741455078125, 0.0043010711669921875, 0.00742340087890625, 0.010545730590820312, 0.013668060302734375, 0.016790390014648438, 0.0199127197265625, 0.023035049438476562, 0.026157379150390625, 0.029279708862304688, 0.03240203857421875, 0.03552436828613281, 0.038646697998046875, 0.04176902770996094, 0.044891357421875, 0.04801368713378906, 0.051136016845703125, 0.05425834655761719, 0.05738067626953125, 0.06050300598144531, 0.06362533569335938, 0.06674766540527344, 0.0698699951171875, 0.07299232482910156, 0.07611465454101562, 0.07923698425292969, 0.08235931396484375, 0.08548164367675781, 0.08860397338867188, 0.09172630310058594, 0.0948486328125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 10.0, 14.0, 29.0, 24.0, 54.0, 296.0, 400.0, 48.0, 28.0, 24.0, 12.0, 16.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022064208984375, -0.02121591567993164, -0.02036762237548828, -0.019519329071044922, -0.018671035766601562, -0.017822742462158203, -0.016974449157714844, -0.016126155853271484, -0.015277862548828125, -0.014429569244384766, -0.013581275939941406, -0.012732982635498047, -0.011884689331054688, -0.011036396026611328, -0.010188102722167969, -0.00933980941772461, -0.00849151611328125, -0.007643222808837891, -0.006794929504394531, -0.005946636199951172, -0.0050983428955078125, -0.004250049591064453, -0.0034017562866210938, -0.0025534629821777344, -0.001705169677734375, -0.0008568763732910156, -8.58306884765625e-06, 0.0008397102355957031, 0.0016880035400390625, 0.002536296844482422, 0.0033845901489257812, 0.004232883453369141, 0.0050811767578125, 0.005929470062255859, 0.006777763366699219, 0.007626056671142578, 0.008474349975585938, 0.009322643280029297, 0.010170936584472656, 0.011019229888916016, 0.011867523193359375, 0.012715816497802734, 0.013564109802246094, 0.014412403106689453, 0.015260696411132812, 0.016108989715576172, 0.01695728302001953, 0.01780557632446289, 0.01865386962890625, 0.01950216293334961, 0.02035045623779297, 0.021198749542236328, 0.022047042846679688, 0.022895336151123047, 0.023743629455566406, 0.024591922760009766, 0.025440216064453125, 0.026288509368896484, 0.027136802673339844, 0.027985095977783203, 0.028833389282226562, 0.029681682586669922, 0.03052997589111328, 0.03137826919555664, 0.0322265625]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 3.0, 7.0, 5.0, 5.0, 7.0, 5.0, 18.0, 22.0, 19.0, 27.0, 30.0, 41.0, 58.0, 48.0, 76.0, 92.0, 96.0, 90.0, 68.0, 53.0, 51.0, 39.0, 30.0, 18.0, 18.0, 13.0, 12.0, 9.0, 7.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.35898101329803467, -0.3474760353565216, -0.33597102761268616, -0.3244660496711731, -0.31296104192733765, -0.3014560639858246, -0.2899510860443115, -0.2784460783004761, -0.266941100358963, -0.25543612241744995, -0.2439311146736145, -0.23242613673210144, -0.22092114388942719, -0.20941615104675293, -0.19791117310523987, -0.1864061802625656, -0.17490118741989136, -0.1633961945772171, -0.15189120173454285, -0.14038622379302979, -0.12888123095035553, -0.11737623810768127, -0.10587125271558762, -0.09436626732349396, -0.0828612744808197, -0.07135628163814545, -0.05985129624605179, -0.04834630712866783, -0.036841318011283875, -0.025336328893899918, -0.01383133977651596, -0.0023263543844223022, 0.009178608655929565, 0.020683597773313522, 0.03218858689069748, 0.043693576008081436, 0.05519856512546539, 0.06670355796813965, 0.0782085433602333, 0.08971352875232697, 0.10121852159500122, 0.11272351443767548, 0.12422849982976913, 0.1357334852218628, 0.14723847806453705, 0.1587434709072113, 0.17024844884872437, 0.18175344169139862, 0.19325843453407288, 0.20476342737674713, 0.2162684202194214, 0.22777339816093445, 0.2392783910036087, 0.25078338384628296, 0.262288361787796, 0.2737933397293091, 0.28529834747314453, 0.2968033254146576, 0.30830833315849304, 0.3198133111000061, 0.33131831884384155, 0.3428232967853546, 0.3543282747268677, 0.3658332824707031, 0.3773382604122162]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 5.0, 7.0, 8.0, 11.0, 9.0, 20.0, 17.0, 15.0, 22.0, 21.0, 34.0, 25.0, 33.0, 30.0, 41.0, 42.0, 31.0, 38.0, 46.0, 52.0, 37.0, 31.0, 29.0, 49.0, 38.0, 45.0, 39.0, 25.0, 19.0, 23.0, 21.0, 20.0, 13.0, 23.0, 14.0, 14.0, 8.0, 7.0, 10.0, 4.0, 4.0, 7.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27471062541007996, -0.26628416776657104, -0.25785771012306213, -0.24943126738071442, -0.2410048246383667, -0.2325783669948578, -0.22415190935134888, -0.21572545170783997, -0.20729900896549225, -0.19887255132198334, -0.19044610857963562, -0.1820196509361267, -0.1735931932926178, -0.16516675055027008, -0.15674029290676117, -0.14831385016441345, -0.13988739252090454, -0.13146093487739563, -0.12303449213504791, -0.114608034491539, -0.10618158429861069, -0.09775513410568237, -0.08932867646217346, -0.08090222626924515, -0.07247577607631683, -0.06404932588338852, -0.05562287196516991, -0.047196418046951294, -0.03876996785402298, -0.030343517661094666, -0.021917063742876053, -0.01349060982465744, -0.005064159631729126, 0.0033622924238443375, 0.011788744479417801, 0.020215196534991264, 0.028641648590564728, 0.03706809878349304, 0.045494552701711655, 0.05392100661993027, 0.06234745681285858, 0.0707739070057869, 0.07920035719871521, 0.08762681484222412, 0.09605326503515244, 0.10447971522808075, 0.11290617287158966, 0.12133262306451797, 0.1297590732574463, 0.1381855309009552, 0.14661197364330292, 0.15503843128681183, 0.16346487402915955, 0.17189133167266846, 0.18031778931617737, 0.18874424695968628, 0.197170689702034, 0.2055971473455429, 0.21402359008789062, 0.22245004773139954, 0.23087650537490845, 0.23930294811725616, 0.24772940576076508, 0.2561558485031128, 0.2645823061466217]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 6.0, 9.0, 9.0, 14.0, 25.0, 34.0, 52.0, 76.0, 115.0, 191.0, 281.0, 462.0, 687.0, 1223.0, 1902.0, 3161.0, 5488.0, 9488.0, 16710.0, 30884.0, 60478.0, 132397.0, 375413.0, 1898681.0, 1193180.0, 248256.0, 102020.0, 50163.0, 26847.0, 14718.0, 8426.0, 5070.0, 3075.0, 1821.0, 1076.0, 680.0, 442.0, 273.0, 149.0, 109.0, 64.0, 38.0, 30.0, 19.0, 12.0, 5.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.53076171875, -0.5150833129882812, -0.4994049072265625, -0.48372650146484375, -0.468048095703125, -0.45236968994140625, -0.4366912841796875, -0.42101287841796875, -0.40533447265625, -0.38965606689453125, -0.3739776611328125, -0.35829925537109375, -0.342620849609375, -0.32694244384765625, -0.3112640380859375, -0.29558563232421875, -0.2799072265625, -0.26422882080078125, -0.2485504150390625, -0.23287200927734375, -0.217193603515625, -0.20151519775390625, -0.1858367919921875, -0.17015838623046875, -0.15447998046875, -0.13880157470703125, -0.1231231689453125, -0.10744476318359375, -0.091766357421875, -0.07608795166015625, -0.0604095458984375, -0.04473114013671875, -0.029052734375, -0.01337432861328125, 0.0023040771484375, 0.01798248291015625, 0.033660888671875, 0.04933929443359375, 0.0650177001953125, 0.08069610595703125, 0.09637451171875, 0.11205291748046875, 0.1277313232421875, 0.14340972900390625, 0.159088134765625, 0.17476654052734375, 0.1904449462890625, 0.20612335205078125, 0.2218017578125, 0.23748016357421875, 0.2531585693359375, 0.26883697509765625, 0.284515380859375, 0.30019378662109375, 0.3158721923828125, 0.33155059814453125, 0.34722900390625, 0.36290740966796875, 0.3785858154296875, 0.39426422119140625, 0.409942626953125, 0.42562103271484375, 0.4412994384765625, 0.45697784423828125, 0.47265625]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 5.0, 4.0, 9.0, 7.0, 10.0, 12.0, 23.0, 19.0, 22.0, 10.0, 23.0, 26.0, 25.0, 35.0, 46.0, 41.0, 40.0, 42.0, 32.0, 42.0, 54.0, 47.0, 40.0, 38.0, 46.0, 40.0, 33.0, 40.0, 24.0, 19.0, 20.0, 27.0, 20.0, 17.0, 10.0, 13.0, 12.0, 7.0, 5.0, 9.0, 4.0, 6.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1700439453125, -0.164642333984375, -0.15924072265625, -0.153839111328125, -0.1484375, -0.143035888671875, -0.13763427734375, -0.132232666015625, -0.1268310546875, -0.121429443359375, -0.11602783203125, -0.110626220703125, -0.105224609375, -0.099822998046875, -0.09442138671875, -0.089019775390625, -0.0836181640625, -0.078216552734375, -0.07281494140625, -0.067413330078125, -0.06201171875, -0.056610107421875, -0.05120849609375, -0.045806884765625, -0.0404052734375, -0.035003662109375, -0.02960205078125, -0.024200439453125, -0.018798828125, -0.013397216796875, -0.00799560546875, -0.002593994140625, 0.0028076171875, 0.008209228515625, 0.01361083984375, 0.019012451171875, 0.0244140625, 0.029815673828125, 0.03521728515625, 0.040618896484375, 0.0460205078125, 0.051422119140625, 0.05682373046875, 0.062225341796875, 0.067626953125, 0.073028564453125, 0.07843017578125, 0.083831787109375, 0.0892333984375, 0.094635009765625, 0.10003662109375, 0.105438232421875, 0.11083984375, 0.116241455078125, 0.12164306640625, 0.127044677734375, 0.1324462890625, 0.137847900390625, 0.14324951171875, 0.148651123046875, 0.154052734375, 0.159454345703125, 0.16485595703125, 0.170257568359375, 0.1756591796875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 3.0, 10.0, 10.0, 17.0, 29.0, 56.0, 70.0, 99.0, 163.0, 253.0, 356.0, 535.0, 846.0, 1317.0, 2009.0, 3216.0, 5183.0, 8227.0, 13858.0, 23631.0, 41692.0, 76377.0, 148510.0, 315348.0, 830661.0, 1648044.0, 570628.0, 239211.0, 117198.0, 62388.0, 34467.0, 19580.0, 11350.0, 6801.0, 4341.0, 2645.0, 1698.0, 1186.0, 728.0, 499.0, 318.0, 201.0, 182.0, 122.0, 80.0, 55.0, 34.0, 24.0, 16.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.324462890625, -0.3144264221191406, -0.30438995361328125, -0.2943534851074219, -0.2843170166015625, -0.2742805480957031, -0.26424407958984375, -0.2542076110839844, -0.244171142578125, -0.23413467407226562, -0.22409820556640625, -0.21406173706054688, -0.2040252685546875, -0.19398880004882812, -0.18395233154296875, -0.17391586303710938, -0.16387939453125, -0.15384292602539062, -0.14380645751953125, -0.13376998901367188, -0.1237335205078125, -0.11369705200195312, -0.10366058349609375, -0.09362411499023438, -0.083587646484375, -0.07355117797851562, -0.06351470947265625, -0.053478240966796875, -0.0434417724609375, -0.033405303955078125, -0.02336883544921875, -0.013332366943359375, -0.0032958984375, 0.006740570068359375, 0.01677703857421875, 0.026813507080078125, 0.0368499755859375, 0.046886444091796875, 0.05692291259765625, 0.06695938110351562, 0.076995849609375, 0.08703231811523438, 0.09706878662109375, 0.10710525512695312, 0.1171417236328125, 0.12717819213867188, 0.13721466064453125, 0.14725112915039062, 0.15728759765625, 0.16732406616210938, 0.17736053466796875, 0.18739700317382812, 0.1974334716796875, 0.20746994018554688, 0.21750640869140625, 0.22754287719726562, 0.237579345703125, 0.24761581420898438, 0.25765228271484375, 0.2676887512207031, 0.2777252197265625, 0.2877616882324219, 0.29779815673828125, 0.3078346252441406, 0.31787109375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 3.0, 4.0, 6.0, 5.0, 6.0, 12.0, 12.0, 21.0, 15.0, 33.0, 28.0, 47.0, 58.0, 88.0, 99.0, 106.0, 146.0, 165.0, 184.0, 226.0, 255.0, 297.0, 347.0, 324.0, 267.0, 233.0, 206.0, 165.0, 123.0, 123.0, 95.0, 70.0, 72.0, 46.0, 41.0, 39.0, 24.0, 18.0, 16.0, 16.0, 11.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10321044921875, -0.10016059875488281, -0.09711074829101562, -0.09406089782714844, -0.09101104736328125, -0.08796119689941406, -0.08491134643554688, -0.08186149597167969, -0.0788116455078125, -0.07576179504394531, -0.07271194458007812, -0.06966209411621094, -0.06661224365234375, -0.06356239318847656, -0.060512542724609375, -0.05746269226074219, -0.054412841796875, -0.05136299133300781, -0.048313140869140625, -0.04526329040527344, -0.04221343994140625, -0.03916358947753906, -0.036113739013671875, -0.03306388854980469, -0.0300140380859375, -0.026964187622070312, -0.023914337158203125, -0.020864486694335938, -0.01781463623046875, -0.014764785766601562, -0.011714935302734375, -0.008665084838867188, -0.005615234375, -0.0025653839111328125, 0.000484466552734375, 0.0035343170166015625, 0.00658416748046875, 0.009634017944335938, 0.012683868408203125, 0.015733718872070312, 0.0187835693359375, 0.021833419799804688, 0.024883270263671875, 0.027933120727539062, 0.03098297119140625, 0.03403282165527344, 0.037082672119140625, 0.04013252258300781, 0.043182373046875, 0.04623222351074219, 0.049282073974609375, 0.05233192443847656, 0.05538177490234375, 0.05843162536621094, 0.061481475830078125, 0.06453132629394531, 0.0675811767578125, 0.07063102722167969, 0.07368087768554688, 0.07673072814941406, 0.07978057861328125, 0.08283042907714844, 0.08588027954101562, 0.08893013000488281, 0.09197998046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 12.0, 14.0, 19.0, 18.0, 18.0, 40.0, 56.0, 41.0, 72.0, 96.0, 119.0, 113.0, 92.0, 72.0, 48.0, 33.0, 28.0, 28.0, 14.0, 12.0, 8.0, 6.0, 10.0, 2.0, 4.0, 5.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31889012455940247, -0.3092280328273773, -0.2995659410953522, -0.289903849363327, -0.2802417576313019, -0.27057966589927673, -0.2609175741672516, -0.25125548243522644, -0.2415933907032013, -0.23193129897117615, -0.222269207239151, -0.21260711550712585, -0.2029450237751007, -0.19328293204307556, -0.18362084031105042, -0.17395874857902527, -0.16429665684700012, -0.15463456511497498, -0.14497247338294983, -0.13531038165092468, -0.12564828991889954, -0.11598619818687439, -0.10632410645484924, -0.0966620147228241, -0.08699992299079895, -0.0773378312587738, -0.06767573952674866, -0.05801364779472351, -0.048351556062698364, -0.03868946433067322, -0.02902737259864807, -0.019365280866622925, -0.00970315933227539, -4.106760025024414e-05, 0.009621024131774902, 0.01928311586380005, 0.028945207595825195, 0.03860729932785034, 0.04826939105987549, 0.057931482791900635, 0.06759357452392578, 0.07725566625595093, 0.08691775798797607, 0.09657984972000122, 0.10624194145202637, 0.11590403318405151, 0.12556612491607666, 0.1352282166481018, 0.14489030838012695, 0.1545524001121521, 0.16421449184417725, 0.1738765835762024, 0.18353867530822754, 0.19320076704025269, 0.20286285877227783, 0.21252495050430298, 0.22218704223632812, 0.23184913396835327, 0.24151122570037842, 0.25117331743240356, 0.2608354091644287, 0.27049750089645386, 0.280159592628479, 0.28982168436050415, 0.2994837760925293]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 6.0, 5.0, 8.0, 10.0, 11.0, 12.0, 20.0, 21.0, 28.0, 34.0, 36.0, 29.0, 29.0, 39.0, 38.0, 47.0, 51.0, 56.0, 43.0, 61.0, 46.0, 45.0, 42.0, 30.0, 59.0, 30.0, 28.0, 32.0, 20.0, 22.0, 11.0, 13.0, 17.0, 6.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21213321387767792, -0.20558418333530426, -0.1990351676940918, -0.19248613715171814, -0.18593710660934448, -0.17938809096813202, -0.17283906042575836, -0.1662900447845459, -0.15974101424217224, -0.15319198369979858, -0.14664296805858612, -0.14009393751621246, -0.133544921875, -0.12699589133262634, -0.12044686079025269, -0.11389783769845963, -0.10734881460666656, -0.1007997915148735, -0.09425076842308044, -0.08770173788070679, -0.08115271478891373, -0.07460369169712067, -0.06805466115474701, -0.06150563806295395, -0.05495661497116089, -0.04840759187936783, -0.04185856506228447, -0.03530953824520111, -0.02876051515340805, -0.02221149206161499, -0.01566246524453163, -0.009113438427448273, -0.0025644302368164062, 0.003984594717621803, 0.010533619672060013, 0.017082644626498222, 0.023631669580936432, 0.030180692672729492, 0.03672971948981285, 0.04327874630689621, 0.04982776939868927, 0.05637679249048233, 0.06292581558227539, 0.06947484612464905, 0.07602386921644211, 0.08257289230823517, 0.08912192285060883, 0.09567094594240189, 0.10221996903419495, 0.108768992125988, 0.11531801521778107, 0.12186704576015472, 0.1284160614013672, 0.13496509194374084, 0.1415141224861145, 0.14806315302848816, 0.15461216866970062, 0.16116119921207428, 0.16771021485328674, 0.1742592453956604, 0.18080827593803406, 0.18735729157924652, 0.19390632212162018, 0.20045533776283264, 0.2070043683052063]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 14.0, 13.0, 30.0, 38.0, 64.0, 84.0, 116.0, 217.0, 298.0, 422.0, 630.0, 995.0, 1580.0, 2464.0, 3731.0, 5806.0, 9638.0, 16867.0, 30282.0, 62367.0, 148583.0, 374740.0, 214908.0, 83983.0, 38699.0, 20748.0, 11748.0, 6970.0, 4345.0, 2853.0, 1905.0, 1192.0, 727.0, 490.0, 353.0, 232.0, 132.0, 95.0, 64.0, 43.0, 29.0, 12.0, 13.0, 14.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0821533203125, -0.0795602798461914, -0.07696723937988281, -0.07437419891357422, -0.07178115844726562, -0.06918811798095703, -0.06659507751464844, -0.06400203704833984, -0.06140899658203125, -0.058815956115722656, -0.05622291564941406, -0.05362987518310547, -0.051036834716796875, -0.04844379425048828, -0.04585075378417969, -0.043257713317871094, -0.0406646728515625, -0.038071632385253906, -0.03547859191894531, -0.03288555145263672, -0.030292510986328125, -0.02769947052001953, -0.025106430053710938, -0.022513389587402344, -0.01992034912109375, -0.017327308654785156, -0.014734268188476562, -0.012141227722167969, -0.009548187255859375, -0.006955146789550781, -0.0043621063232421875, -0.0017690658569335938, 0.000823974609375, 0.0034170150756835938, 0.0060100555419921875, 0.008603096008300781, 0.011196136474609375, 0.013789176940917969, 0.016382217407226562, 0.018975257873535156, 0.02156829833984375, 0.024161338806152344, 0.026754379272460938, 0.02934741973876953, 0.031940460205078125, 0.03453350067138672, 0.03712654113769531, 0.039719581604003906, 0.0423126220703125, 0.044905662536621094, 0.04749870300292969, 0.05009174346923828, 0.052684783935546875, 0.05527782440185547, 0.05787086486816406, 0.060463905334472656, 0.06305694580078125, 0.06564998626708984, 0.06824302673339844, 0.07083606719970703, 0.07342910766601562, 0.07602214813232422, 0.07861518859863281, 0.0812082290649414, 0.08380126953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 9.0, 12.0, 9.0, 15.0, 17.0, 21.0, 26.0, 29.0, 25.0, 37.0, 37.0, 31.0, 45.0, 44.0, 40.0, 36.0, 48.0, 57.0, 54.0, 48.0, 34.0, 37.0, 37.0, 35.0, 38.0, 19.0, 29.0, 23.0, 20.0, 8.0, 20.0, 10.0, 10.0, 9.0, 4.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.22998046875, -0.2237377166748047, -0.21749496459960938, -0.21125221252441406, -0.20500946044921875, -0.19876670837402344, -0.19252395629882812, -0.1862812042236328, -0.1800384521484375, -0.1737957000732422, -0.16755294799804688, -0.16131019592285156, -0.15506744384765625, -0.14882469177246094, -0.14258193969726562, -0.1363391876220703, -0.130096435546875, -0.12385368347167969, -0.11761093139648438, -0.11136817932128906, -0.10512542724609375, -0.09888267517089844, -0.09263992309570312, -0.08639717102050781, -0.0801544189453125, -0.07391166687011719, -0.06766891479492188, -0.06142616271972656, -0.05518341064453125, -0.04894065856933594, -0.042697906494140625, -0.03645515441894531, -0.03021240234375, -0.023969650268554688, -0.017726898193359375, -0.011484146118164062, -0.00524139404296875, 0.0010013580322265625, 0.007244110107421875, 0.013486862182617188, 0.0197296142578125, 0.025972366333007812, 0.032215118408203125, 0.03845787048339844, 0.04470062255859375, 0.05094337463378906, 0.057186126708984375, 0.06342887878417969, 0.069671630859375, 0.07591438293457031, 0.08215713500976562, 0.08839988708496094, 0.09464263916015625, 0.10088539123535156, 0.10712814331054688, 0.11337089538574219, 0.1196136474609375, 0.1258563995361328, 0.13209915161132812, 0.13834190368652344, 0.14458465576171875, 0.15082740783691406, 0.15707015991210938, 0.1633129119873047, 0.1695556640625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 8.0, 12.0, 21.0, 31.0, 32.0, 53.0, 70.0, 99.0, 145.0, 236.0, 288.0, 451.0, 642.0, 1002.0, 1572.0, 2501.0, 3959.0, 6643.0, 11631.0, 21520.0, 42928.0, 100782.0, 361983.0, 311272.0, 92208.0, 40061.0, 20409.0, 10881.0, 6325.0, 3825.0, 2344.0, 1554.0, 981.0, 621.0, 450.0, 295.0, 202.0, 143.0, 112.0, 74.0, 49.0, 24.0, 31.0, 24.0, 16.0, 12.0, 5.0, 4.0, 6.0, 2.0, 4.0, 3.0], "bins": [-0.110107421875, -0.10695743560791016, -0.10380744934082031, -0.10065746307373047, -0.09750747680664062, -0.09435749053955078, -0.09120750427246094, -0.0880575180053711, -0.08490753173828125, -0.0817575454711914, -0.07860755920410156, -0.07545757293701172, -0.07230758666992188, -0.06915760040283203, -0.06600761413574219, -0.06285762786865234, -0.0597076416015625, -0.056557655334472656, -0.05340766906738281, -0.05025768280029297, -0.047107696533203125, -0.04395771026611328, -0.04080772399902344, -0.037657737731933594, -0.03450775146484375, -0.031357765197753906, -0.028207778930664062, -0.02505779266357422, -0.021907806396484375, -0.01875782012939453, -0.015607833862304688, -0.012457847595214844, -0.009307861328125, -0.006157875061035156, -0.0030078887939453125, 0.00014209747314453125, 0.003292083740234375, 0.006442070007324219, 0.009592056274414062, 0.012742042541503906, 0.01589202880859375, 0.019042015075683594, 0.022192001342773438, 0.02534198760986328, 0.028491973876953125, 0.03164196014404297, 0.03479194641113281, 0.037941932678222656, 0.0410919189453125, 0.044241905212402344, 0.04739189147949219, 0.05054187774658203, 0.053691864013671875, 0.05684185028076172, 0.05999183654785156, 0.0631418228149414, 0.06629180908203125, 0.0694417953491211, 0.07259178161621094, 0.07574176788330078, 0.07889175415039062, 0.08204174041748047, 0.08519172668457031, 0.08834171295166016, 0.09149169921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 0.0, 7.0, 7.0, 10.0, 14.0, 9.0, 17.0, 9.0, 18.0, 26.0, 25.0, 27.0, 37.0, 33.0, 37.0, 32.0, 31.0, 41.0, 35.0, 34.0, 49.0, 41.0, 41.0, 43.0, 46.0, 35.0, 37.0, 32.0, 40.0, 33.0, 24.0, 17.0, 17.0, 15.0, 20.0, 7.0, 15.0, 11.0, 10.0, 3.0, 3.0, 4.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10546875, -0.10179710388183594, -0.09812545776367188, -0.09445381164550781, -0.09078216552734375, -0.08711051940917969, -0.08343887329101562, -0.07976722717285156, -0.0760955810546875, -0.07242393493652344, -0.06875228881835938, -0.06508064270019531, -0.06140899658203125, -0.05773735046386719, -0.054065704345703125, -0.05039405822753906, -0.046722412109375, -0.04305076599121094, -0.039379119873046875, -0.03570747375488281, -0.03203582763671875, -0.028364181518554688, -0.024692535400390625, -0.021020889282226562, -0.0173492431640625, -0.013677597045898438, -0.010005950927734375, -0.0063343048095703125, -0.00266265869140625, 0.0010089874267578125, 0.004680633544921875, 0.008352279663085938, 0.01202392578125, 0.015695571899414062, 0.019367218017578125, 0.023038864135742188, 0.02671051025390625, 0.030382156372070312, 0.034053802490234375, 0.03772544860839844, 0.0413970947265625, 0.04506874084472656, 0.048740386962890625, 0.05241203308105469, 0.05608367919921875, 0.05975532531738281, 0.06342697143554688, 0.06709861755371094, 0.070770263671875, 0.07444190979003906, 0.07811355590820312, 0.08178520202636719, 0.08545684814453125, 0.08912849426269531, 0.09280014038085938, 0.09647178649902344, 0.1001434326171875, 0.10381507873535156, 0.10748672485351562, 0.11115837097167969, 0.11483001708984375, 0.11850166320800781, 0.12217330932617188, 0.12584495544433594, 0.1295166015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 6.0, 8.0, 16.0, 15.0, 18.0, 23.0, 40.0, 60.0, 86.0, 124.0, 159.0, 213.0, 327.0, 403.0, 626.0, 934.0, 1314.0, 2177.0, 3425.0, 5645.0, 10243.0, 20086.0, 48097.0, 173710.0, 606266.0, 102545.0, 34709.0, 15806.0, 8100.0, 4705.0, 2876.0, 1896.0, 1222.0, 774.0, 538.0, 362.0, 269.0, 202.0, 124.0, 100.0, 85.0, 49.0, 43.0, 29.0, 32.0, 18.0, 16.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.007129669189453125, -0.006902098655700684, -0.006674528121948242, -0.006446957588195801, -0.006219387054443359, -0.005991816520690918, -0.0057642459869384766, -0.005536675453186035, -0.005309104919433594, -0.005081534385681152, -0.004853963851928711, -0.0046263933181762695, -0.004398822784423828, -0.004171252250671387, -0.003943681716918945, -0.003716111183166504, -0.0034885406494140625, -0.003260970115661621, -0.0030333995819091797, -0.0028058290481567383, -0.002578258514404297, -0.0023506879806518555, -0.002123117446899414, -0.0018955469131469727, -0.0016679763793945312, -0.0014404058456420898, -0.0012128353118896484, -0.000985264778137207, -0.0007576942443847656, -0.0005301237106323242, -0.0003025531768798828, -7.49826431274414e-05, 0.000152587890625, 0.0003801584243774414, 0.0006077289581298828, 0.0008352994918823242, 0.0010628700256347656, 0.001290440559387207, 0.0015180110931396484, 0.0017455816268920898, 0.0019731521606445312, 0.0022007226943969727, 0.002428293228149414, 0.0026558637619018555, 0.002883434295654297, 0.0031110048294067383, 0.0033385753631591797, 0.003566145896911621, 0.0037937164306640625, 0.004021286964416504, 0.004248857498168945, 0.004476428031921387, 0.004703998565673828, 0.0049315690994262695, 0.005159139633178711, 0.005386710166931152, 0.005614280700683594, 0.005841851234436035, 0.0060694217681884766, 0.006296992301940918, 0.006524562835693359, 0.006752133369445801, 0.006979703903198242, 0.007207274436950684, 0.007434844970703125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 6.0, 6.0, 5.0, 14.0, 13.0, 5.0, 19.0, 25.0, 26.0, 38.0, 45.0, 0.0, 41.0, 66.0, 51.0, 79.0, 70.0, 89.0, 70.0, 70.0, 56.0, 41.0, 35.0, 34.0, 21.0, 12.0, 8.0, 10.0, 9.0, 12.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.086162567138672e-06, -2.028420567512512e-06, -1.9706785678863525e-06, -1.912936568260193e-06, -1.8551945686340332e-06, -1.7974525690078735e-06, -1.7397105693817139e-06, -1.6819685697555542e-06, -1.6242265701293945e-06, -1.5664845705032349e-06, -1.5087425708770752e-06, -1.4510005712509155e-06, -1.3932585716247559e-06, -1.3355165719985962e-06, -1.2777745723724365e-06, -1.2200325727462769e-06, -1.1622905731201172e-06, -1.1045485734939575e-06, -1.0468065738677979e-06, -9.890645742416382e-07, -9.313225746154785e-07, -8.735805749893188e-07, -8.158385753631592e-07, -7.580965757369995e-07, -7.003545761108398e-07, -6.426125764846802e-07, -5.848705768585205e-07, -5.271285772323608e-07, -4.6938657760620117e-07, -4.116445779800415e-07, -3.5390257835388184e-07, -2.9616057872772217e-07, -2.384185791015625e-07, -1.8067657947540283e-07, -1.2293457984924316e-07, -6.51925802230835e-08, -7.450580596923828e-09, 5.029141902923584e-08, 1.0803341865539551e-07, 1.6577541828155518e-07, 2.2351741790771484e-07, 2.812594175338745e-07, 3.390014171600342e-07, 3.9674341678619385e-07, 4.544854164123535e-07, 5.122274160385132e-07, 5.699694156646729e-07, 6.277114152908325e-07, 6.854534149169922e-07, 7.431954145431519e-07, 8.009374141693115e-07, 8.586794137954712e-07, 9.164214134216309e-07, 9.741634130477905e-07, 1.0319054126739502e-06, 1.0896474123001099e-06, 1.1473894119262695e-06, 1.2051314115524292e-06, 1.2628734111785889e-06, 1.3206154108047485e-06, 1.3783574104309082e-06, 1.4360994100570679e-06, 1.4938414096832275e-06, 1.5515834093093872e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 6.0, 10.0, 12.0, 23.0, 19.0, 37.0, 34.0, 88.0, 130.0, 191.0, 291.0, 374.0, 577.0, 811.0, 1222.0, 1676.0, 2561.0, 3858.0, 5947.0, 9985.0, 18506.0, 38833.0, 100367.0, 470610.0, 250564.0, 72551.0, 30230.0, 15069.0, 8296.0, 5192.0, 3274.0, 2252.0, 1504.0, 1054.0, 719.0, 513.0, 348.0, 240.0, 189.0, 146.0, 88.0, 47.0, 39.0, 29.0, 20.0, 9.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007732391357421875, -0.007473289966583252, -0.007214188575744629, -0.006955087184906006, -0.006695985794067383, -0.00643688440322876, -0.006177783012390137, -0.005918681621551514, -0.005659580230712891, -0.005400478839874268, -0.0051413774490356445, -0.0048822760581970215, -0.0046231746673583984, -0.004364073276519775, -0.004104971885681152, -0.0038458704948425293, -0.0035867691040039062, -0.003327667713165283, -0.00306856632232666, -0.002809464931488037, -0.002550363540649414, -0.002291262149810791, -0.002032160758972168, -0.001773059368133545, -0.0015139579772949219, -0.0012548565864562988, -0.0009957551956176758, -0.0007366538047790527, -0.0004775524139404297, -0.00021845102310180664, 4.0650367736816406e-05, 0.00029975175857543945, 0.0005588531494140625, 0.0008179545402526855, 0.0010770559310913086, 0.0013361573219299316, 0.0015952587127685547, 0.0018543601036071777, 0.0021134614944458008, 0.002372562885284424, 0.002631664276123047, 0.00289076566696167, 0.003149867057800293, 0.003408968448638916, 0.003668069839477539, 0.003927171230316162, 0.004186272621154785, 0.004445374011993408, 0.004704475402832031, 0.004963576793670654, 0.005222678184509277, 0.0054817795753479, 0.0057408809661865234, 0.0059999823570251465, 0.0062590837478637695, 0.006518185138702393, 0.006777286529541016, 0.007036387920379639, 0.007295489311218262, 0.007554590702056885, 0.007813692092895508, 0.00807279348373413, 0.008331894874572754, 0.008590996265411377, 0.00885009765625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 7.0, 4.0, 13.0, 16.0, 22.0, 16.0, 28.0, 42.0, 40.0, 64.0, 80.0, 95.0, 177.0, 101.0, 60.0, 46.0, 38.0, 35.0, 25.0, 16.0, 15.0, 15.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023708343505859375, -0.002286583185195923, -0.002202332019805908, -0.0021180808544158936, -0.002033829689025879, -0.0019495785236358643, -0.0018653273582458496, -0.001781076192855835, -0.0016968250274658203, -0.0016125738620758057, -0.001528322696685791, -0.0014440715312957764, -0.0013598203659057617, -0.001275569200515747, -0.0011913180351257324, -0.0011070668697357178, -0.0010228157043457031, -0.0009385645389556885, -0.0008543133735656738, -0.0007700622081756592, -0.0006858110427856445, -0.0006015598773956299, -0.0005173087120056152, -0.0004330575466156006, -0.00034880638122558594, -0.0002645552158355713, -0.00018030405044555664, -9.605288505554199e-05, -1.1801719665527344e-05, 7.24494457244873e-05, 0.00015670061111450195, 0.0002409517765045166, 0.00032520294189453125, 0.0004094541072845459, 0.0004937052726745605, 0.0005779564380645752, 0.0006622076034545898, 0.0007464587688446045, 0.0008307099342346191, 0.0009149610996246338, 0.0009992122650146484, 0.001083463430404663, 0.0011677145957946777, 0.0012519657611846924, 0.001336216926574707, 0.0014204680919647217, 0.0015047192573547363, 0.001588970422744751, 0.0016732215881347656, 0.0017574727535247803, 0.001841723918914795, 0.0019259750843048096, 0.0020102262496948242, 0.002094477415084839, 0.0021787285804748535, 0.002262979745864868, 0.002347230911254883, 0.0024314820766448975, 0.002515733242034912, 0.0025999844074249268, 0.0026842355728149414, 0.002768486738204956, 0.0028527379035949707, 0.0029369890689849854, 0.003021240234375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 11.0, 13.0, 19.0, 15.0, 20.0, 30.0, 51.0, 46.0, 63.0, 87.0, 105.0, 127.0, 91.0, 76.0, 64.0, 40.0, 30.0, 32.0, 10.0, 14.0, 10.0, 7.0, 9.0, 3.0, 5.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3213573694229126, -0.31171128153800964, -0.3020651936531067, -0.29241910576820374, -0.2827730178833008, -0.2731269299983978, -0.2634808421134949, -0.25383472442626953, -0.24418865144252777, -0.23454256355762482, -0.22489647567272186, -0.2152503877878189, -0.20560428500175476, -0.1959581971168518, -0.18631210923194885, -0.1766660213470459, -0.16701993346214294, -0.15737384557724, -0.14772775769233704, -0.13808166980743408, -0.12843558192253113, -0.11878948658704758, -0.10914339125156403, -0.09949730336666107, -0.08985121548175812, -0.08020512759685516, -0.07055903971195221, -0.06091294437646866, -0.051266856491565704, -0.04162076860666275, -0.0319746769964695, -0.022328585386276245, -0.012682527303695679, -0.0030364375561475754, 0.006609652191400528, 0.01625574193894863, 0.025901831686496735, 0.03554791957139969, 0.04519401118159294, 0.054840102791786194, 0.06448619067668915, 0.0741322785615921, 0.08377836644649506, 0.09342446178197861, 0.10307054966688156, 0.11271663755178452, 0.12236273288726807, 0.13200882077217102, 0.14165490865707397, 0.15130099654197693, 0.16094708442687988, 0.17059317231178284, 0.1802392601966858, 0.18988534808158875, 0.1995314508676529, 0.20917753875255585, 0.2188236266374588, 0.22846971452236176, 0.2381158024072647, 0.24776189029216766, 0.2574079930782318, 0.26705408096313477, 0.2767001688480377, 0.2863462567329407, 0.29599234461784363]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 12.0, 10.0, 12.0, 19.0, 23.0, 27.0, 35.0, 37.0, 26.0, 29.0, 41.0, 36.0, 50.0, 50.0, 57.0, 43.0, 59.0, 50.0, 39.0, 44.0, 33.0, 56.0, 30.0, 28.0, 31.0, 22.0, 21.0, 14.0, 12.0, 14.0, 8.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21242164075374603, -0.20587141811847687, -0.1993211954832077, -0.19277097284793854, -0.18622073531150818, -0.179670512676239, -0.17312029004096985, -0.16657006740570068, -0.16001984477043152, -0.15346962213516235, -0.1469193994998932, -0.14036917686462402, -0.13381895422935486, -0.1272687315940857, -0.12071849405765533, -0.11416827142238617, -0.107618048787117, -0.10106782615184784, -0.09451760351657867, -0.08796737343072891, -0.08141715079545975, -0.07486692816019058, -0.06831669807434082, -0.061766475439071655, -0.05521625280380249, -0.048666030168533325, -0.04211580380797386, -0.0355655774474144, -0.029015354812145233, -0.022465132176876068, -0.015914905816316605, -0.009364679455757141, -0.002814456820487976, 0.003735767677426338, 0.010285992175340652, 0.016836216673254967, 0.02338644117116928, 0.029936663806438446, 0.03648689016699791, 0.04303711652755737, 0.04958733916282654, 0.0561375617980957, 0.06268778443336487, 0.06923801451921463, 0.0757882371544838, 0.08233845978975296, 0.08888868987560272, 0.09543891251087189, 0.10198913514614105, 0.10853935778141022, 0.11508958041667938, 0.12163981050252914, 0.1281900405883789, 0.13474026322364807, 0.14129048585891724, 0.1478407084941864, 0.15439093112945557, 0.16094115376472473, 0.1674913763999939, 0.17404159903526306, 0.18059182167053223, 0.1871420443058014, 0.19369228184223175, 0.20024250447750092, 0.20679272711277008]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 8.0, 15.0, 20.0, 32.0, 46.0, 78.0, 101.0, 141.0, 252.0, 314.0, 535.0, 819.0, 1367.0, 2073.0, 3474.0, 5400.0, 8968.0, 14886.0, 25169.0, 43680.0, 79980.0, 166510.0, 329937.0, 172731.0, 81780.0, 45044.0, 25751.0, 15261.0, 9161.0, 5580.0, 3439.0, 2222.0, 1328.0, 861.0, 581.0, 341.0, 230.0, 138.0, 97.0, 56.0, 46.0, 31.0, 26.0, 16.0, 12.0, 11.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36328125, -0.3505439758300781, -0.33780670166015625, -0.3250694274902344, -0.3123321533203125, -0.2995948791503906, -0.28685760498046875, -0.2741203308105469, -0.261383056640625, -0.24864578247070312, -0.23590850830078125, -0.22317123413085938, -0.2104339599609375, -0.19769668579101562, -0.18495941162109375, -0.17222213745117188, -0.15948486328125, -0.14674758911132812, -0.13401031494140625, -0.12127304077148438, -0.1085357666015625, -0.09579849243164062, -0.08306121826171875, -0.07032394409179688, -0.057586669921875, -0.044849395751953125, -0.03211212158203125, -0.019374847412109375, -0.0066375732421875, 0.006099700927734375, 0.01883697509765625, 0.031574249267578125, 0.0443115234375, 0.057048797607421875, 0.06978607177734375, 0.08252334594726562, 0.0952606201171875, 0.10799789428710938, 0.12073516845703125, 0.13347244262695312, 0.146209716796875, 0.15894699096679688, 0.17168426513671875, 0.18442153930664062, 0.1971588134765625, 0.20989608764648438, 0.22263336181640625, 0.23537063598632812, 0.24810791015625, 0.2608451843261719, 0.27358245849609375, 0.2863197326660156, 0.2990570068359375, 0.3117942810058594, 0.32453155517578125, 0.3372688293457031, 0.350006103515625, 0.3627433776855469, 0.37548065185546875, 0.3882179260253906, 0.4009552001953125, 0.4136924743652344, 0.42642974853515625, 0.4391670227050781, 0.451904296875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 6.0, 8.0, 8.0, 12.0, 11.0, 18.0, 19.0, 24.0, 21.0, 22.0, 28.0, 28.0, 26.0, 28.0, 41.0, 46.0, 32.0, 47.0, 49.0, 38.0, 47.0, 44.0, 52.0, 34.0, 30.0, 41.0, 35.0, 29.0, 29.0, 20.0, 19.0, 22.0, 14.0, 12.0, 10.0, 7.0, 14.0, 3.0, 7.0, 3.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1793212890625, -0.17424774169921875, -0.1691741943359375, -0.16410064697265625, -0.159027099609375, -0.15395355224609375, -0.1488800048828125, -0.14380645751953125, -0.13873291015625, -0.13365936279296875, -0.1285858154296875, -0.12351226806640625, -0.118438720703125, -0.11336517333984375, -0.1082916259765625, -0.10321807861328125, -0.09814453125, -0.09307098388671875, -0.0879974365234375, -0.08292388916015625, -0.077850341796875, -0.07277679443359375, -0.0677032470703125, -0.06262969970703125, -0.05755615234375, -0.05248260498046875, -0.0474090576171875, -0.04233551025390625, -0.037261962890625, -0.03218841552734375, -0.0271148681640625, -0.02204132080078125, -0.0169677734375, -0.01189422607421875, -0.0068206787109375, -0.00174713134765625, 0.003326416015625, 0.00839996337890625, 0.0134735107421875, 0.01854705810546875, 0.02362060546875, 0.02869415283203125, 0.0337677001953125, 0.03884124755859375, 0.043914794921875, 0.04898834228515625, 0.0540618896484375, 0.05913543701171875, 0.064208984375, 0.06928253173828125, 0.0743560791015625, 0.07942962646484375, 0.084503173828125, 0.08957672119140625, 0.0946502685546875, 0.09972381591796875, 0.10479736328125, 0.10987091064453125, 0.1149444580078125, 0.12001800537109375, 0.125091552734375, 0.13016510009765625, 0.1352386474609375, 0.14031219482421875, 0.1453857421875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 9.0, 13.0, 16.0, 20.0, 31.0, 50.0, 79.0, 94.0, 132.0, 235.0, 303.0, 376.0, 637.0, 922.0, 1353.0, 1911.0, 2933.0, 4611.0, 7172.0, 11094.0, 17551.0, 28350.0, 46754.0, 80175.0, 148205.0, 284213.0, 177376.0, 93085.0, 53423.0, 31853.0, 19993.0, 12451.0, 7764.0, 5093.0, 3313.0, 2221.0, 1459.0, 1030.0, 702.0, 469.0, 322.0, 236.0, 165.0, 98.0, 84.0, 62.0, 42.0, 24.0, 14.0, 15.0, 9.0, 6.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.330810546875, -0.32035064697265625, -0.3098907470703125, -0.29943084716796875, -0.288970947265625, -0.27851104736328125, -0.2680511474609375, -0.25759124755859375, -0.24713134765625, -0.23667144775390625, -0.2262115478515625, -0.21575164794921875, -0.205291748046875, -0.19483184814453125, -0.1843719482421875, -0.17391204833984375, -0.1634521484375, -0.15299224853515625, -0.1425323486328125, -0.13207244873046875, -0.121612548828125, -0.11115264892578125, -0.1006927490234375, -0.09023284912109375, -0.07977294921875, -0.06931304931640625, -0.0588531494140625, -0.04839324951171875, -0.037933349609375, -0.02747344970703125, -0.0170135498046875, -0.00655364990234375, 0.00390625, 0.01436614990234375, 0.0248260498046875, 0.03528594970703125, 0.045745849609375, 0.05620574951171875, 0.0666656494140625, 0.07712554931640625, 0.08758544921875, 0.09804534912109375, 0.1085052490234375, 0.11896514892578125, 0.129425048828125, 0.13988494873046875, 0.1503448486328125, 0.16080474853515625, 0.1712646484375, 0.18172454833984375, 0.1921844482421875, 0.20264434814453125, 0.213104248046875, 0.22356414794921875, 0.2340240478515625, 0.24448394775390625, 0.25494384765625, 0.26540374755859375, 0.2758636474609375, 0.28632354736328125, 0.296783447265625, 0.30724334716796875, 0.3177032470703125, 0.32816314697265625, 0.338623046875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 4.0, 1.0, 1.0, 8.0, 9.0, 12.0, 12.0, 17.0, 26.0, 30.0, 29.0, 26.0, 38.0, 40.0, 46.0, 54.0, 49.0, 54.0, 43.0, 51.0, 59.0, 45.0, 42.0, 38.0, 48.0, 33.0, 25.0, 34.0, 27.0, 24.0, 15.0, 17.0, 12.0, 5.0, 6.0, 7.0, 4.0, 6.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10992431640625, -0.1061697006225586, -0.10241508483886719, -0.09866046905517578, -0.09490585327148438, -0.09115123748779297, -0.08739662170410156, -0.08364200592041016, -0.07988739013671875, -0.07613277435302734, -0.07237815856933594, -0.06862354278564453, -0.06486892700195312, -0.06111431121826172, -0.05735969543457031, -0.053605079650878906, -0.0498504638671875, -0.046095848083496094, -0.04234123229980469, -0.03858661651611328, -0.034832000732421875, -0.03107738494873047, -0.027322769165039062, -0.023568153381347656, -0.01981353759765625, -0.016058921813964844, -0.012304306030273438, -0.008549690246582031, -0.004795074462890625, -0.0010404586791992188, 0.0027141571044921875, 0.006468772888183594, 0.010223388671875, 0.013978004455566406, 0.017732620239257812, 0.02148723602294922, 0.025241851806640625, 0.02899646759033203, 0.03275108337402344, 0.036505699157714844, 0.04026031494140625, 0.044014930725097656, 0.04776954650878906, 0.05152416229248047, 0.055278778076171875, 0.05903339385986328, 0.06278800964355469, 0.0665426254272461, 0.0702972412109375, 0.0740518569946289, 0.07780647277832031, 0.08156108856201172, 0.08531570434570312, 0.08907032012939453, 0.09282493591308594, 0.09657955169677734, 0.10033416748046875, 0.10408878326416016, 0.10784339904785156, 0.11159801483154297, 0.11535263061523438, 0.11910724639892578, 0.12286186218261719, 0.1266164779663086, 0.13037109375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 16.0, 16.0, 17.0, 34.0, 38.0, 49.0, 71.0, 107.0, 131.0, 157.0, 237.0, 330.0, 421.0, 537.0, 775.0, 1042.0, 1451.0, 2060.0, 2854.0, 4312.0, 6566.0, 10464.0, 18589.0, 42912.0, 792642.0, 96252.0, 27048.0, 13765.0, 8165.0, 5129.0, 3480.0, 2440.0, 1718.0, 1239.0, 943.0, 672.0, 503.0, 322.0, 250.0, 207.0, 160.0, 129.0, 80.0, 66.0, 28.0, 31.0, 26.0, 22.0, 32.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.0311279296875, -0.030147552490234375, -0.02916717529296875, -0.028186798095703125, -0.0272064208984375, -0.026226043701171875, -0.02524566650390625, -0.024265289306640625, -0.023284912109375, -0.022304534912109375, -0.02132415771484375, -0.020343780517578125, -0.0193634033203125, -0.018383026123046875, -0.01740264892578125, -0.016422271728515625, -0.01544189453125, -0.014461517333984375, -0.01348114013671875, -0.012500762939453125, -0.0115203857421875, -0.010540008544921875, -0.00955963134765625, -0.008579254150390625, -0.007598876953125, -0.006618499755859375, -0.00563812255859375, -0.004657745361328125, -0.0036773681640625, -0.002696990966796875, -0.00171661376953125, -0.000736236572265625, 0.000244140625, 0.001224517822265625, 0.00220489501953125, 0.003185272216796875, 0.0041656494140625, 0.005146026611328125, 0.00612640380859375, 0.007106781005859375, 0.008087158203125, 0.009067535400390625, 0.01004791259765625, 0.011028289794921875, 0.0120086669921875, 0.012989044189453125, 0.01396942138671875, 0.014949798583984375, 0.01593017578125, 0.016910552978515625, 0.01789093017578125, 0.018871307373046875, 0.0198516845703125, 0.020832061767578125, 0.02181243896484375, 0.022792816162109375, 0.023773193359375, 0.024753570556640625, 0.02573394775390625, 0.026714324951171875, 0.0276947021484375, 0.028675079345703125, 0.02965545654296875, 0.030635833740234375, 0.0316162109375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 14.0, 5.0, 33.0, 11.0, 55.0, 175.0, 111.0, 300.0, 86.0, 114.0, 27.0, 25.0, 17.0, 3.0, 8.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.682209014892578e-06, -2.5872141122817993e-06, -2.4922192096710205e-06, -2.3972243070602417e-06, -2.302229404449463e-06, -2.207234501838684e-06, -2.1122395992279053e-06, -2.0172446966171265e-06, -1.9222497940063477e-06, -1.8272548913955688e-06, -1.73225998878479e-06, -1.6372650861740112e-06, -1.5422701835632324e-06, -1.4472752809524536e-06, -1.3522803783416748e-06, -1.257285475730896e-06, -1.1622905731201172e-06, -1.0672956705093384e-06, -9.723007678985596e-07, -8.773058652877808e-07, -7.82310962677002e-07, -6.873160600662231e-07, -5.923211574554443e-07, -4.973262548446655e-07, -4.023313522338867e-07, -3.073364496231079e-07, -2.123415470123291e-07, -1.1734664440155029e-07, -2.2351741790771484e-08, 7.264316082000732e-08, 1.6763806343078613e-07, 2.6263296604156494e-07, 3.5762786865234375e-07, 4.5262277126312256e-07, 5.476176738739014e-07, 6.426125764846802e-07, 7.37607479095459e-07, 8.326023817062378e-07, 9.275972843170166e-07, 1.0225921869277954e-06, 1.1175870895385742e-06, 1.212581992149353e-06, 1.3075768947601318e-06, 1.4025717973709106e-06, 1.4975666999816895e-06, 1.5925616025924683e-06, 1.687556505203247e-06, 1.7825514078140259e-06, 1.8775463104248047e-06, 1.9725412130355835e-06, 2.0675361156463623e-06, 2.162531018257141e-06, 2.25752592086792e-06, 2.3525208234786987e-06, 2.4475157260894775e-06, 2.5425106287002563e-06, 2.637505531311035e-06, 2.732500433921814e-06, 2.8274953365325928e-06, 2.9224902391433716e-06, 3.0174851417541504e-06, 3.112480044364929e-06, 3.207474946975708e-06, 3.302469849586487e-06, 3.3974647521972656e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 13.0, 7.0, 31.0, 26.0, 45.0, 56.0, 98.0, 136.0, 175.0, 259.0, 384.0, 550.0, 792.0, 1129.0, 1696.0, 2642.0, 4245.0, 7356.0, 15596.0, 47852.0, 859552.0, 65394.0, 18657.0, 8593.0, 4756.0, 2856.0, 1810.0, 1171.0, 812.0, 560.0, 348.0, 273.0, 208.0, 127.0, 81.0, 79.0, 48.0, 42.0, 33.0, 19.0, 12.0, 11.0, 6.0, 4.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.044158935546875, -0.04271554946899414, -0.04127216339111328, -0.03982877731323242, -0.03838539123535156, -0.0369420051574707, -0.035498619079589844, -0.034055233001708984, -0.032611846923828125, -0.031168460845947266, -0.029725074768066406, -0.028281688690185547, -0.026838302612304688, -0.025394916534423828, -0.02395153045654297, -0.02250814437866211, -0.02106475830078125, -0.01962137222290039, -0.01817798614501953, -0.016734600067138672, -0.015291213989257812, -0.013847827911376953, -0.012404441833496094, -0.010961055755615234, -0.009517669677734375, -0.008074283599853516, -0.006630897521972656, -0.005187511444091797, -0.0037441253662109375, -0.002300739288330078, -0.0008573532104492188, 0.0005860328674316406, 0.0020294189453125, 0.0034728050231933594, 0.004916191101074219, 0.006359577178955078, 0.0078029632568359375, 0.009246349334716797, 0.010689735412597656, 0.012133121490478516, 0.013576507568359375, 0.015019893646240234, 0.016463279724121094, 0.017906665802001953, 0.019350051879882812, 0.020793437957763672, 0.02223682403564453, 0.02368021011352539, 0.02512359619140625, 0.02656698226928711, 0.02801036834716797, 0.029453754425048828, 0.030897140502929688, 0.03234052658081055, 0.033783912658691406, 0.035227298736572266, 0.036670684814453125, 0.038114070892333984, 0.039557456970214844, 0.0410008430480957, 0.04244422912597656, 0.04388761520385742, 0.04533100128173828, 0.04677438735961914, 0.0482177734375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 2.0, 4.0, 4.0, 6.0, 3.0, 9.0, 8.0, 7.0, 18.0, 19.0, 40.0, 81.0, 550.0, 99.0, 27.0, 26.0, 18.0, 10.0, 19.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01084136962890625, -0.010498762130737305, -0.01015615463256836, -0.009813547134399414, -0.009470939636230469, -0.009128332138061523, -0.008785724639892578, -0.008443117141723633, -0.008100509643554688, -0.007757902145385742, -0.007415294647216797, -0.0070726871490478516, -0.006730079650878906, -0.006387472152709961, -0.006044864654541016, -0.00570225715637207, -0.005359649658203125, -0.00501704216003418, -0.004674434661865234, -0.004331827163696289, -0.003989219665527344, -0.0036466121673583984, -0.003304004669189453, -0.002961397171020508, -0.0026187896728515625, -0.002276182174682617, -0.0019335746765136719, -0.0015909671783447266, -0.0012483596801757812, -0.0009057521820068359, -0.0005631446838378906, -0.0002205371856689453, 0.0001220703125, 0.0004646778106689453, 0.0008072853088378906, 0.001149892807006836, 0.0014925003051757812, 0.0018351078033447266, 0.002177715301513672, 0.002520322799682617, 0.0028629302978515625, 0.003205537796020508, 0.003548145294189453, 0.0038907527923583984, 0.004233360290527344, 0.004575967788696289, 0.004918575286865234, 0.00526118278503418, 0.005603790283203125, 0.00594639778137207, 0.006289005279541016, 0.006631612777709961, 0.006974220275878906, 0.0073168277740478516, 0.007659435272216797, 0.008002042770385742, 0.008344650268554688, 0.008687257766723633, 0.009029865264892578, 0.009372472763061523, 0.009715080261230469, 0.010057687759399414, 0.01040029525756836, 0.010742902755737305, 0.01108551025390625]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 3.0, 2.0, 8.0, 2.0, 7.0, 16.0, 5.0, 14.0, 16.0, 22.0, 24.0, 34.0, 56.0, 63.0, 109.0, 119.0, 111.0, 111.0, 57.0, 41.0, 38.0, 31.0, 17.0, 16.0, 19.0, 9.0, 13.0, 9.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28838932514190674, -0.27993184328079224, -0.27147436141967773, -0.26301687955856323, -0.25455939769744873, -0.24610193073749542, -0.23764446377754211, -0.2291869819164276, -0.2207295000553131, -0.2122720181941986, -0.2038145363330841, -0.1953570693731308, -0.1868995875120163, -0.1784421056509018, -0.1699846386909485, -0.16152715682983398, -0.15306967496871948, -0.14461219310760498, -0.13615471124649048, -0.12769724428653717, -0.11923976242542267, -0.11078228056430817, -0.10232480615377426, -0.09386733174324036, -0.08540984988212585, -0.07695236802101135, -0.06849489361047745, -0.060037415474653244, -0.05157993733882904, -0.04312245920300484, -0.034664981067180634, -0.02620750293135643, -0.017750024795532227, -0.009292546659708023, -0.0008350685238838196, 0.007622409611940384, 0.016079887747764587, 0.02453736588358879, 0.032994844019412994, 0.0414523221552372, 0.0499098002910614, 0.058367278426885605, 0.06682475656270981, 0.07528223097324371, 0.08373971283435822, 0.09219719469547272, 0.10065466910600662, 0.10911214351654053, 0.11756962537765503, 0.12602710723876953, 0.13448458909988403, 0.14294205605983734, 0.15139953792095184, 0.15985701978206635, 0.16831448674201965, 0.17677196860313416, 0.18522945046424866, 0.19368693232536316, 0.20214441418647766, 0.21060188114643097, 0.21905936300754547, 0.22751684486865997, 0.23597431182861328, 0.24443179368972778, 0.2528892755508423]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 11.0, 9.0, 6.0, 10.0, 9.0, 13.0, 11.0, 33.0, 40.0, 30.0, 27.0, 34.0, 41.0, 41.0, 58.0, 50.0, 58.0, 50.0, 50.0, 49.0, 47.0, 38.0, 53.0, 36.0, 44.0, 33.0, 22.0, 20.0, 19.0, 13.0, 12.0, 8.0, 8.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18577787280082703, -0.17945516109466553, -0.17313244938850403, -0.16680973768234253, -0.16048702597618103, -0.15416431427001953, -0.14784160256385803, -0.14151889085769653, -0.13519617915153503, -0.12887346744537354, -0.12255075573921204, -0.11622804403305054, -0.10990533232688904, -0.10358262062072754, -0.09725990146398544, -0.09093718975782394, -0.08461447060108185, -0.07829175889492035, -0.07196904718875885, -0.06564633548259735, -0.059323620051145554, -0.053000908344984055, -0.04667819291353226, -0.04035548120737076, -0.03403276950120926, -0.02771005779504776, -0.021387344226241112, -0.015064630657434464, -0.008741918951272964, -0.0024192072451114655, 0.003903508186340332, 0.010226219892501831, 0.01654893159866333, 0.02287164330482483, 0.029194356873631477, 0.035517070442438126, 0.041839782148599625, 0.048162493854761124, 0.05448520928621292, 0.06080792099237442, 0.06713063269853592, 0.07345334440469742, 0.07977605611085892, 0.08609877526760101, 0.09242148697376251, 0.09874419867992401, 0.10506691038608551, 0.11138962209224701, 0.11771233379840851, 0.12403504550457001, 0.1303577572107315, 0.136680468916893, 0.1430031806230545, 0.149325892329216, 0.1556486189365387, 0.1619713306427002, 0.1682940423488617, 0.1746167540550232, 0.1809394657611847, 0.1872621774673462, 0.1935848891735077, 0.1999076008796692, 0.2062303125858307, 0.2125530242919922, 0.2188757359981537]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 4.0, 10.0, 18.0, 25.0, 35.0, 54.0, 58.0, 110.0, 164.0, 223.0, 329.0, 500.0, 725.0, 1089.0, 1611.0, 2526.0, 3861.0, 6039.0, 10202.0, 17364.0, 30962.0, 59292.0, 124318.0, 328361.0, 1678849.0, 1403809.0, 289708.0, 110477.0, 53537.0, 28431.0, 15969.0, 9334.0, 5789.0, 3632.0, 2352.0, 1508.0, 965.0, 668.0, 457.0, 297.0, 188.0, 127.0, 107.0, 69.0, 40.0, 25.0, 19.0, 14.0, 13.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.275390625, -0.2664909362792969, -0.25759124755859375, -0.24869155883789062, -0.2397918701171875, -0.23089218139648438, -0.22199249267578125, -0.21309280395507812, -0.204193115234375, -0.19529342651367188, -0.18639373779296875, -0.17749404907226562, -0.1685943603515625, -0.15969467163085938, -0.15079498291015625, -0.14189529418945312, -0.13299560546875, -0.12409591674804688, -0.11519622802734375, -0.10629653930664062, -0.0973968505859375, -0.08849716186523438, -0.07959747314453125, -0.07069778442382812, -0.061798095703125, -0.052898406982421875, -0.04399871826171875, -0.035099029541015625, -0.0261993408203125, -0.017299652099609375, -0.00839996337890625, 0.000499725341796875, 0.0093994140625, 0.018299102783203125, 0.02719879150390625, 0.036098480224609375, 0.0449981689453125, 0.053897857666015625, 0.06279754638671875, 0.07169723510742188, 0.080596923828125, 0.08949661254882812, 0.09839630126953125, 0.10729598999023438, 0.1161956787109375, 0.12509536743164062, 0.13399505615234375, 0.14289474487304688, 0.15179443359375, 0.16069412231445312, 0.16959381103515625, 0.17849349975585938, 0.1873931884765625, 0.19629287719726562, 0.20519256591796875, 0.21409225463867188, 0.222991943359375, 0.23189163208007812, 0.24079132080078125, 0.24969100952148438, 0.2585906982421875, 0.2674903869628906, 0.27639007568359375, 0.2852897644042969, 0.294189453125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 9.0, 11.0, 9.0, 10.0, 11.0, 17.0, 30.0, 21.0, 28.0, 24.0, 25.0, 29.0, 37.0, 43.0, 36.0, 40.0, 53.0, 46.0, 45.0, 49.0, 51.0, 41.0, 31.0, 36.0, 36.0, 35.0, 28.0, 27.0, 29.0, 13.0, 14.0, 10.0, 14.0, 7.0, 3.0, 12.0, 5.0, 9.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.10565185546875, -0.10254096984863281, -0.09943008422851562, -0.09631919860839844, -0.09320831298828125, -0.09009742736816406, -0.08698654174804688, -0.08387565612792969, -0.0807647705078125, -0.07765388488769531, -0.07454299926757812, -0.07143211364746094, -0.06832122802734375, -0.06521034240722656, -0.062099456787109375, -0.05898857116699219, -0.055877685546875, -0.05276679992675781, -0.049655914306640625, -0.04654502868652344, -0.04343414306640625, -0.04032325744628906, -0.037212371826171875, -0.03410148620605469, -0.0309906005859375, -0.027879714965820312, -0.024768829345703125, -0.021657943725585938, -0.01854705810546875, -0.015436172485351562, -0.012325286865234375, -0.009214401245117188, -0.006103515625, -0.0029926300048828125, 0.000118255615234375, 0.0032291412353515625, 0.00634002685546875, 0.009450912475585938, 0.012561798095703125, 0.015672683715820312, 0.0187835693359375, 0.021894454956054688, 0.025005340576171875, 0.028116226196289062, 0.03122711181640625, 0.03433799743652344, 0.037448883056640625, 0.04055976867675781, 0.043670654296875, 0.04678153991699219, 0.049892425537109375, 0.05300331115722656, 0.05611419677734375, 0.05922508239746094, 0.062335968017578125, 0.06544685363769531, 0.0685577392578125, 0.07166862487792969, 0.07477951049804688, 0.07789039611816406, 0.08100128173828125, 0.08411216735839844, 0.08722305297851562, 0.09033393859863281, 0.09344482421875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 11.0, 16.0, 19.0, 29.0, 45.0, 58.0, 59.0, 125.0, 169.0, 241.0, 374.0, 454.0, 728.0, 1013.0, 1372.0, 1996.0, 2938.0, 4300.0, 6298.0, 9318.0, 14327.0, 22141.0, 34886.0, 57113.0, 96774.0, 173471.0, 338568.0, 797293.0, 1444557.0, 567434.0, 263713.0, 139573.0, 80343.0, 48239.0, 29446.0, 18876.0, 12060.0, 8070.0, 5483.0, 3819.0, 2574.0, 1810.0, 1271.0, 885.0, 599.0, 424.0, 310.0, 202.0, 137.0, 100.0, 84.0, 48.0, 31.0, 20.0, 17.0, 13.0, 7.0, 0.0, 2.0, 8.0], "bins": [-0.1527099609375, -0.14798545837402344, -0.14326095581054688, -0.1385364532470703, -0.13381195068359375, -0.1290874481201172, -0.12436294555664062, -0.11963844299316406, -0.1149139404296875, -0.11018943786621094, -0.10546493530273438, -0.10074043273925781, -0.09601593017578125, -0.09129142761230469, -0.08656692504882812, -0.08184242248535156, -0.077117919921875, -0.07239341735839844, -0.06766891479492188, -0.06294441223144531, -0.05821990966796875, -0.05349540710449219, -0.048770904541015625, -0.04404640197753906, -0.0393218994140625, -0.03459739685058594, -0.029872894287109375, -0.025148391723632812, -0.02042388916015625, -0.015699386596679688, -0.010974884033203125, -0.0062503814697265625, -0.00152587890625, 0.0031986236572265625, 0.007923126220703125, 0.012647628784179688, 0.01737213134765625, 0.022096633911132812, 0.026821136474609375, 0.03154563903808594, 0.0362701416015625, 0.04099464416503906, 0.045719146728515625, 0.05044364929199219, 0.05516815185546875, 0.05989265441894531, 0.06461715698242188, 0.06934165954589844, 0.074066162109375, 0.07879066467285156, 0.08351516723632812, 0.08823966979980469, 0.09296417236328125, 0.09768867492675781, 0.10241317749023438, 0.10713768005371094, 0.1118621826171875, 0.11658668518066406, 0.12131118774414062, 0.1260356903076172, 0.13076019287109375, 0.1354846954345703, 0.14020919799804688, 0.14493370056152344, 0.149658203125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 7.0, 11.0, 9.0, 10.0, 12.0, 11.0, 21.0, 15.0, 33.0, 41.0, 48.0, 58.0, 70.0, 90.0, 107.0, 111.0, 138.0, 186.0, 192.0, 259.0, 298.0, 334.0, 336.0, 276.0, 251.0, 218.0, 156.0, 149.0, 116.0, 98.0, 79.0, 68.0, 61.0, 37.0, 26.0, 33.0, 19.0, 29.0, 14.0, 8.0, 9.0, 9.0, 6.0, 5.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.052978515625, -0.051321983337402344, -0.04966545104980469, -0.04800891876220703, -0.046352386474609375, -0.04469585418701172, -0.04303932189941406, -0.041382789611816406, -0.03972625732421875, -0.038069725036621094, -0.03641319274902344, -0.03475666046142578, -0.033100128173828125, -0.03144359588623047, -0.029787063598632812, -0.028130531311035156, -0.0264739990234375, -0.024817466735839844, -0.023160934448242188, -0.02150440216064453, -0.019847869873046875, -0.01819133758544922, -0.016534805297851562, -0.014878273010253906, -0.01322174072265625, -0.011565208435058594, -0.009908676147460938, -0.008252143859863281, -0.006595611572265625, -0.004939079284667969, -0.0032825469970703125, -0.0016260147094726562, 3.0517578125e-05, 0.0016870498657226562, 0.0033435821533203125, 0.005000114440917969, 0.006656646728515625, 0.008313179016113281, 0.009969711303710938, 0.011626243591308594, 0.01328277587890625, 0.014939308166503906, 0.016595840454101562, 0.01825237274169922, 0.019908905029296875, 0.02156543731689453, 0.023221969604492188, 0.024878501892089844, 0.0265350341796875, 0.028191566467285156, 0.029848098754882812, 0.03150463104248047, 0.033161163330078125, 0.03481769561767578, 0.03647422790527344, 0.038130760192871094, 0.03978729248046875, 0.041443824768066406, 0.04310035705566406, 0.04475688934326172, 0.046413421630859375, 0.04806995391845703, 0.04972648620605469, 0.051383018493652344, 0.05303955078125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 3.0, 8.0, 11.0, 17.0, 20.0, 19.0, 36.0, 38.0, 34.0, 41.0, 68.0, 84.0, 102.0, 101.0, 74.0, 61.0, 53.0, 32.0, 35.0, 32.0, 23.0, 17.0, 10.0, 11.0, 9.0, 6.0, 9.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13841359317302704, -0.13380412757396698, -0.12919466197490692, -0.12458519637584686, -0.1199757307767868, -0.11536626517772675, -0.11075679957866669, -0.10614733397960663, -0.10153786838054657, -0.09692840278148651, -0.09231893718242645, -0.0877094715833664, -0.08310000598430634, -0.07849054038524628, -0.07388107478618622, -0.06927160918712616, -0.0646621435880661, -0.06005267798900604, -0.055443212389945984, -0.050833746790885925, -0.04622428119182587, -0.04161481559276581, -0.03700534999370575, -0.03239588439464569, -0.027786418795585632, -0.023176953196525574, -0.018567487597465515, -0.013958021998405457, -0.009348556399345398, -0.004739090800285339, -0.00012962520122528076, 0.004479840397834778, 0.009089291095733643, 0.013698756694793701, 0.01830822229385376, 0.02291768789291382, 0.027527153491973877, 0.032136619091033936, 0.036746084690093994, 0.04135555028915405, 0.04596501588821411, 0.05057448148727417, 0.05518394708633423, 0.05979341268539429, 0.06440287828445435, 0.0690123438835144, 0.07362180948257446, 0.07823127508163452, 0.08284074068069458, 0.08745020627975464, 0.0920596718788147, 0.09666913747787476, 0.10127860307693481, 0.10588806867599487, 0.11049753427505493, 0.11510699987411499, 0.11971646547317505, 0.12432593107223511, 0.12893539667129517, 0.13354486227035522, 0.13815432786941528, 0.14276379346847534, 0.1473732590675354, 0.15198272466659546, 0.15659219026565552]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 8.0, 12.0, 14.0, 20.0, 19.0, 21.0, 31.0, 39.0, 32.0, 38.0, 35.0, 46.0, 45.0, 36.0, 55.0, 59.0, 42.0, 41.0, 45.0, 51.0, 44.0, 42.0, 39.0, 42.0, 27.0, 16.0, 10.0, 20.0, 14.0, 13.0, 11.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.114858478307724, -0.11095969378948212, -0.10706091672182083, -0.10316213220357895, -0.09926334768533707, -0.09536457061767578, -0.0914657860994339, -0.08756700158119202, -0.08366822451353073, -0.07976943999528885, -0.07587066292762756, -0.07197187840938568, -0.0680730938911438, -0.06417431682348251, -0.06027553230524063, -0.05637675151228905, -0.052477966994047165, -0.04857918620109558, -0.0446804016828537, -0.040781620889902115, -0.03688284009695053, -0.03298405557870865, -0.029085274785757065, -0.02518649399280548, -0.021287711337208748, -0.017388928681612015, -0.013490147888660431, -0.009591365233063698, -0.005692583508789539, -0.0017938017845153809, 0.0021049808710813522, 0.006003761664032936, 0.00990254431962967, 0.013801326043903828, 0.017700107768177986, 0.02159889042377472, 0.025497671216726303, 0.029396453872323036, 0.03329523652791977, 0.03719401732087135, 0.04109279811382294, 0.04499157890677452, 0.0488903634250164, 0.05278914421796799, 0.05668792501091957, 0.060586705803871155, 0.06448549032211304, 0.06838427484035492, 0.0722830593585968, 0.07618184387683868, 0.08008062094449997, 0.08397940546274185, 0.08787818998098373, 0.09177696704864502, 0.0956757515668869, 0.09957453608512878, 0.10347331315279007, 0.10737209767103195, 0.11127087473869324, 0.11516965925693512, 0.119068443775177, 0.12296722084283829, 0.12686601281166077, 0.13076478242874146, 0.13466356694698334]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 15.0, 13.0, 26.0, 44.0, 76.0, 87.0, 127.0, 214.0, 342.0, 492.0, 741.0, 1173.0, 1666.0, 2675.0, 4179.0, 6703.0, 11066.0, 18347.0, 31844.0, 59522.0, 122693.0, 304680.0, 254154.0, 104011.0, 52049.0, 28468.0, 16499.0, 9750.0, 5971.0, 3778.0, 2510.0, 1574.0, 976.0, 705.0, 451.0, 302.0, 208.0, 129.0, 85.0, 60.0, 47.0, 31.0, 21.0, 17.0, 6.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.039764404296875, -0.03855562210083008, -0.037346839904785156, -0.036138057708740234, -0.03492927551269531, -0.03372049331665039, -0.03251171112060547, -0.03130292892456055, -0.030094146728515625, -0.028885364532470703, -0.02767658233642578, -0.02646780014038086, -0.025259017944335938, -0.024050235748291016, -0.022841453552246094, -0.021632671356201172, -0.02042388916015625, -0.019215106964111328, -0.018006324768066406, -0.016797542572021484, -0.015588760375976562, -0.01437997817993164, -0.013171195983886719, -0.011962413787841797, -0.010753631591796875, -0.009544849395751953, -0.008336067199707031, -0.007127285003662109, -0.0059185028076171875, -0.004709720611572266, -0.0035009384155273438, -0.002292156219482422, -0.0010833740234375, 0.00012540817260742188, 0.0013341903686523438, 0.0025429725646972656, 0.0037517547607421875, 0.004960536956787109, 0.006169319152832031, 0.007378101348876953, 0.008586883544921875, 0.009795665740966797, 0.011004447937011719, 0.01221323013305664, 0.013422012329101562, 0.014630794525146484, 0.015839576721191406, 0.017048358917236328, 0.01825714111328125, 0.019465923309326172, 0.020674705505371094, 0.021883487701416016, 0.023092269897460938, 0.02430105209350586, 0.02550983428955078, 0.026718616485595703, 0.027927398681640625, 0.029136180877685547, 0.03034496307373047, 0.03155374526977539, 0.03276252746582031, 0.033971309661865234, 0.035180091857910156, 0.03638887405395508, 0.03759765625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 7.0, 5.0, 14.0, 6.0, 18.0, 23.0, 24.0, 25.0, 24.0, 31.0, 34.0, 33.0, 50.0, 42.0, 41.0, 49.0, 42.0, 53.0, 48.0, 46.0, 44.0, 35.0, 57.0, 46.0, 30.0, 34.0, 25.0, 24.0, 10.0, 14.0, 15.0, 13.0, 7.0, 7.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1102294921875, -0.10632705688476562, -0.10242462158203125, -0.09852218627929688, -0.0946197509765625, -0.09071731567382812, -0.08681488037109375, -0.08291244506835938, -0.079010009765625, -0.07510757446289062, -0.07120513916015625, -0.06730270385742188, -0.0634002685546875, -0.059497833251953125, -0.05559539794921875, -0.051692962646484375, -0.04779052734375, -0.043888092041015625, -0.03998565673828125, -0.036083221435546875, -0.0321807861328125, -0.028278350830078125, -0.02437591552734375, -0.020473480224609375, -0.016571044921875, -0.012668609619140625, -0.00876617431640625, -0.004863739013671875, -0.0009613037109375, 0.002941131591796875, 0.00684356689453125, 0.010746002197265625, 0.0146484375, 0.018550872802734375, 0.02245330810546875, 0.026355743408203125, 0.0302581787109375, 0.034160614013671875, 0.03806304931640625, 0.041965484619140625, 0.045867919921875, 0.049770355224609375, 0.05367279052734375, 0.057575225830078125, 0.0614776611328125, 0.06538009643554688, 0.06928253173828125, 0.07318496704101562, 0.07708740234375, 0.08098983764648438, 0.08489227294921875, 0.08879470825195312, 0.0926971435546875, 0.09659957885742188, 0.10050201416015625, 0.10440444946289062, 0.108306884765625, 0.11220932006835938, 0.11611175537109375, 0.12001419067382812, 0.1239166259765625, 0.12781906127929688, 0.13172149658203125, 0.13562393188476562, 0.1395263671875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 7.0, 10.0, 9.0, 13.0, 12.0, 31.0, 36.0, 56.0, 63.0, 90.0, 143.0, 165.0, 267.0, 361.0, 565.0, 777.0, 1273.0, 1970.0, 3120.0, 5223.0, 9029.0, 16394.0, 32062.0, 71228.0, 210890.0, 464390.0, 125155.0, 49709.0, 24058.0, 12638.0, 7121.0, 4255.0, 2519.0, 1658.0, 1032.0, 699.0, 453.0, 333.0, 206.0, 143.0, 105.0, 87.0, 51.0, 47.0, 25.0, 24.0, 17.0, 7.0, 10.0, 7.0, 4.0, 0.0, 5.0, 1.0, 2.0, 4.0], "bins": [-0.059173583984375, -0.05739593505859375, -0.0556182861328125, -0.05384063720703125, -0.05206298828125, -0.05028533935546875, -0.0485076904296875, -0.04673004150390625, -0.044952392578125, -0.04317474365234375, -0.0413970947265625, -0.03961944580078125, -0.037841796875, -0.03606414794921875, -0.0342864990234375, -0.03250885009765625, -0.030731201171875, -0.02895355224609375, -0.0271759033203125, -0.02539825439453125, -0.02362060546875, -0.02184295654296875, -0.0200653076171875, -0.01828765869140625, -0.016510009765625, -0.01473236083984375, -0.0129547119140625, -0.01117706298828125, -0.0093994140625, -0.00762176513671875, -0.0058441162109375, -0.00406646728515625, -0.002288818359375, -0.00051116943359375, 0.0012664794921875, 0.00304412841796875, 0.00482177734375, 0.00659942626953125, 0.0083770751953125, 0.01015472412109375, 0.011932373046875, 0.01371002197265625, 0.0154876708984375, 0.01726531982421875, 0.01904296875, 0.02082061767578125, 0.0225982666015625, 0.02437591552734375, 0.026153564453125, 0.02793121337890625, 0.0297088623046875, 0.03148651123046875, 0.03326416015625, 0.03504180908203125, 0.0368194580078125, 0.03859710693359375, 0.040374755859375, 0.04215240478515625, 0.0439300537109375, 0.04570770263671875, 0.0474853515625, 0.04926300048828125, 0.0510406494140625, 0.05281829833984375, 0.054595947265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 7.0, 11.0, 14.0, 13.0, 24.0, 16.0, 15.0, 29.0, 25.0, 31.0, 40.0, 33.0, 36.0, 40.0, 47.0, 49.0, 47.0, 47.0, 46.0, 29.0, 36.0, 35.0, 33.0, 53.0, 26.0, 33.0, 21.0, 23.0, 26.0, 20.0, 13.0, 11.0, 10.0, 11.0, 11.0, 6.0, 2.0, 3.0, 10.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0760498046875, -0.0737924575805664, -0.07153511047363281, -0.06927776336669922, -0.06702041625976562, -0.06476306915283203, -0.06250572204589844, -0.060248374938964844, -0.05799102783203125, -0.055733680725097656, -0.05347633361816406, -0.05121898651123047, -0.048961639404296875, -0.04670429229736328, -0.04444694519042969, -0.042189598083496094, -0.0399322509765625, -0.037674903869628906, -0.03541755676269531, -0.03316020965576172, -0.030902862548828125, -0.02864551544189453, -0.026388168334960938, -0.024130821228027344, -0.02187347412109375, -0.019616127014160156, -0.017358779907226562, -0.015101432800292969, -0.012844085693359375, -0.010586738586425781, -0.008329391479492188, -0.006072044372558594, -0.003814697265625, -0.0015573501586914062, 0.0006999969482421875, 0.0029573440551757812, 0.005214691162109375, 0.007472038269042969, 0.009729385375976562, 0.011986732482910156, 0.01424407958984375, 0.016501426696777344, 0.018758773803710938, 0.02101612091064453, 0.023273468017578125, 0.02553081512451172, 0.027788162231445312, 0.030045509338378906, 0.0323028564453125, 0.034560203552246094, 0.03681755065917969, 0.03907489776611328, 0.041332244873046875, 0.04358959197998047, 0.04584693908691406, 0.048104286193847656, 0.05036163330078125, 0.052618980407714844, 0.05487632751464844, 0.05713367462158203, 0.059391021728515625, 0.06164836883544922, 0.06390571594238281, 0.0661630630493164, 0.06842041015625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 9.0, 4.0, 11.0, 4.0, 11.0, 7.0, 18.0, 29.0, 34.0, 56.0, 51.0, 98.0, 107.0, 157.0, 241.0, 350.0, 543.0, 766.0, 1234.0, 2078.0, 3362.0, 5860.0, 11156.0, 23389.0, 57185.0, 250854.0, 554979.0, 76272.0, 28944.0, 13441.0, 6986.0, 3860.0, 2260.0, 1395.0, 921.0, 579.0, 378.0, 245.0, 199.0, 152.0, 86.0, 57.0, 51.0, 32.0, 26.0, 14.0, 26.0, 14.0, 9.0, 4.0, 8.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0], "bins": [-0.0045928955078125, -0.004429638385772705, -0.00426638126373291, -0.004103124141693115, -0.00393986701965332, -0.0037766098976135254, -0.0036133527755737305, -0.0034500956535339355, -0.0032868385314941406, -0.0031235814094543457, -0.0029603242874145508, -0.002797067165374756, -0.002633810043334961, -0.002470552921295166, -0.002307295799255371, -0.002144038677215576, -0.0019807815551757812, -0.0018175244331359863, -0.0016542673110961914, -0.0014910101890563965, -0.0013277530670166016, -0.0011644959449768066, -0.0010012388229370117, -0.0008379817008972168, -0.0006747245788574219, -0.000511467456817627, -0.00034821033477783203, -0.0001849532127380371, -2.1696090698242188e-05, 0.00014156103134155273, 0.00030481815338134766, 0.0004680752754211426, 0.0006313323974609375, 0.0007945895195007324, 0.0009578466415405273, 0.0011211037635803223, 0.0012843608856201172, 0.0014476180076599121, 0.001610875129699707, 0.001774132251739502, 0.0019373893737792969, 0.002100646495819092, 0.0022639036178588867, 0.0024271607398986816, 0.0025904178619384766, 0.0027536749839782715, 0.0029169321060180664, 0.0030801892280578613, 0.0032434463500976562, 0.003406703472137451, 0.003569960594177246, 0.003733217716217041, 0.003896474838256836, 0.004059731960296631, 0.004222989082336426, 0.004386246204376221, 0.004549503326416016, 0.0047127604484558105, 0.0048760175704956055, 0.0050392746925354, 0.005202531814575195, 0.00536578893661499, 0.005529046058654785, 0.00569230318069458, 0.005855560302734375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 0.0, 14.0, 27.0, 21.0, 0.0, 40.0, 55.0, 69.0, 0.0, 83.0, 114.0, 105.0, 0.0, 102.0, 87.0, 73.0, 0.0, 55.0, 35.0, 30.0, 0.0, 26.0, 13.0, 12.0, 0.0, 10.0, 6.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3262033462524414e-06, -1.2814998626708984e-06, -1.2367963790893555e-06, -1.1920928955078125e-06, -1.1473894119262695e-06, -1.1026859283447266e-06, -1.0579824447631836e-06, -1.0132789611816406e-06, -9.685754776000977e-07, -9.238719940185547e-07, -8.791685104370117e-07, -8.344650268554688e-07, -7.897615432739258e-07, -7.450580596923828e-07, -7.003545761108398e-07, -6.556510925292969e-07, -6.109476089477539e-07, -5.662441253662109e-07, -5.21540641784668e-07, -4.76837158203125e-07, -4.3213367462158203e-07, -3.8743019104003906e-07, -3.427267074584961e-07, -2.980232238769531e-07, -2.5331974029541016e-07, -2.086162567138672e-07, -1.6391277313232422e-07, -1.1920928955078125e-07, -7.450580596923828e-08, -2.9802322387695312e-08, 1.4901161193847656e-08, 5.960464477539063e-08, 1.043081283569336e-07, 1.4901161193847656e-07, 1.9371509552001953e-07, 2.384185791015625e-07, 2.8312206268310547e-07, 3.2782554626464844e-07, 3.725290298461914e-07, 4.172325134277344e-07, 4.6193599700927734e-07, 5.066394805908203e-07, 5.513429641723633e-07, 5.960464477539062e-07, 6.407499313354492e-07, 6.854534149169922e-07, 7.301568984985352e-07, 7.748603820800781e-07, 8.195638656616211e-07, 8.642673492431641e-07, 9.08970832824707e-07, 9.5367431640625e-07, 9.98377799987793e-07, 1.043081283569336e-06, 1.087784767150879e-06, 1.1324882507324219e-06, 1.1771917343139648e-06, 1.2218952178955078e-06, 1.2665987014770508e-06, 1.3113021850585938e-06, 1.3560056686401367e-06, 1.4007091522216797e-06, 1.4454126358032227e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 4.0, 8.0, 12.0, 15.0, 18.0, 32.0, 41.0, 57.0, 66.0, 120.0, 136.0, 244.0, 316.0, 453.0, 699.0, 1017.0, 1537.0, 2330.0, 3719.0, 5726.0, 9531.0, 16165.0, 30421.0, 63867.0, 181973.0, 501439.0, 119535.0, 48724.0, 24310.0, 13723.0, 8055.0, 4930.0, 3204.0, 2096.0, 1354.0, 852.0, 599.0, 377.0, 279.0, 161.0, 123.0, 93.0, 60.0, 33.0, 31.0, 20.0, 17.0, 9.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.004497528076171875, -0.004362583160400391, -0.004227638244628906, -0.004092693328857422, -0.0039577484130859375, -0.003822803497314453, -0.0036878585815429688, -0.0035529136657714844, -0.00341796875, -0.0032830238342285156, -0.0031480789184570312, -0.003013134002685547, -0.0028781890869140625, -0.002743244171142578, -0.0026082992553710938, -0.0024733543395996094, -0.002338409423828125, -0.0022034645080566406, -0.0020685195922851562, -0.0019335746765136719, -0.0017986297607421875, -0.0016636848449707031, -0.0015287399291992188, -0.0013937950134277344, -0.00125885009765625, -0.0011239051818847656, -0.0009889602661132812, -0.0008540153503417969, -0.0007190704345703125, -0.0005841255187988281, -0.00044918060302734375, -0.0003142356872558594, -0.000179290771484375, -4.4345855712890625e-05, 9.059906005859375e-05, 0.00022554397583007812, 0.0003604888916015625, 0.0004954338073730469, 0.0006303787231445312, 0.0007653236389160156, 0.0009002685546875, 0.0010352134704589844, 0.0011701583862304688, 0.0013051033020019531, 0.0014400482177734375, 0.0015749931335449219, 0.0017099380493164062, 0.0018448829650878906, 0.001979827880859375, 0.0021147727966308594, 0.0022497177124023438, 0.002384662628173828, 0.0025196075439453125, 0.002654552459716797, 0.0027894973754882812, 0.0029244422912597656, 0.00305938720703125, 0.0031943321228027344, 0.0033292770385742188, 0.003464221954345703, 0.0035991668701171875, 0.003734111785888672, 0.0038690567016601562, 0.004004001617431641, 0.004138946533203125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 10.0, 10.0, 9.0, 14.0, 16.0, 20.0, 24.0, 26.0, 46.0, 53.0, 92.0, 125.0, 140.0, 101.0, 70.0, 42.0, 44.0, 24.0, 15.0, 15.0, 13.0, 12.0, 11.0, 10.0, 6.0, 6.0, 9.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014562606811523438, -0.0014109760522842407, -0.0013656914234161377, -0.0013204067945480347, -0.0012751221656799316, -0.0012298375368118286, -0.0011845529079437256, -0.0011392682790756226, -0.0010939836502075195, -0.0010486990213394165, -0.0010034143924713135, -0.0009581297636032104, -0.0009128451347351074, -0.0008675605058670044, -0.0008222758769989014, -0.0007769912481307983, -0.0007317066192626953, -0.0006864219903945923, -0.0006411373615264893, -0.0005958527326583862, -0.0005505681037902832, -0.0005052834749221802, -0.00045999884605407715, -0.0004147142171859741, -0.0003694295883178711, -0.00032414495944976807, -0.00027886033058166504, -0.000233575701713562, -0.00018829107284545898, -0.00014300644397735596, -9.772181510925293e-05, -5.24371862411499e-05, -7.152557373046875e-06, 3.813207149505615e-05, 8.341670036315918e-05, 0.0001287013292312622, 0.00017398595809936523, 0.00021927058696746826, 0.0002645552158355713, 0.0003098398447036743, 0.00035512447357177734, 0.00040040910243988037, 0.0004456937313079834, 0.0004909783601760864, 0.0005362629890441895, 0.0005815476179122925, 0.0006268322467803955, 0.0006721168756484985, 0.0007174015045166016, 0.0007626861333847046, 0.0008079707622528076, 0.0008532553911209106, 0.0008985400199890137, 0.0009438246488571167, 0.0009891092777252197, 0.0010343939065933228, 0.0010796785354614258, 0.0011249631643295288, 0.0011702477931976318, 0.0012155324220657349, 0.0012608170509338379, 0.001306101679801941, 0.001351386308670044, 0.001396670937538147, 0.00144195556640625]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 1.0, 0.0, 6.0, 7.0, 3.0, 5.0, 3.0, 11.0, 13.0, 17.0, 17.0, 24.0, 40.0, 35.0, 34.0, 43.0, 83.0, 89.0, 103.0, 93.0, 64.0, 65.0, 45.0, 33.0, 35.0, 28.0, 21.0, 14.0, 11.0, 9.0, 9.0, 6.0, 8.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1359325647354126, -0.13135482370853424, -0.12677708268165588, -0.12219933420419693, -0.11762158572673798, -0.11304384469985962, -0.10846610367298126, -0.1038883626461029, -0.09931061416864395, -0.0947328731417656, -0.09015512466430664, -0.08557738363742828, -0.08099964261054993, -0.07642189413309097, -0.07184415310621262, -0.06726640462875366, -0.0626886636018753, -0.05811091884970665, -0.053533174097537994, -0.04895543307065964, -0.04437768831849098, -0.03979994356632233, -0.03522220253944397, -0.030644457787275314, -0.02606671303510666, -0.021488968282938004, -0.016911225393414497, -0.012333481572568417, -0.007755737751722336, -0.0031779929995536804, 0.0013997498899698257, 0.005977492779493332, 0.010555237531661987, 0.015132981352508068, 0.01971072517335415, 0.024288468062877655, 0.02886621281504631, 0.033443957567214966, 0.03802169859409332, 0.04259944334626198, 0.047177188098430634, 0.05175493285059929, 0.056332677602767944, 0.0609104186296463, 0.06548815965652466, 0.07006590813398361, 0.07464364916086197, 0.07922139763832092, 0.08379913866519928, 0.08837687969207764, 0.09295462816953659, 0.09753236919641495, 0.1021101176738739, 0.10668785870075226, 0.11126559972763062, 0.11584334075450897, 0.12042108923196793, 0.12499883025884628, 0.12957657873630524, 0.1341543197631836, 0.13873206079006195, 0.1433098018169403, 0.14788755774497986, 0.15246529877185822, 0.15704303979873657]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 9.0, 8.0, 12.0, 15.0, 21.0, 18.0, 22.0, 32.0, 39.0, 30.0, 38.0, 36.0, 47.0, 45.0, 38.0, 54.0, 60.0, 40.0, 44.0, 43.0, 52.0, 43.0, 41.0, 39.0, 40.0, 26.0, 19.0, 8.0, 19.0, 14.0, 14.0, 12.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11386560648679733, -0.10997967422008514, -0.10609373450279236, -0.10220780223608017, -0.09832186251878738, -0.0944359302520752, -0.09054999053478241, -0.08666405826807022, -0.08277812600135803, -0.07889219373464584, -0.07500625401735306, -0.07112032175064087, -0.06723438203334808, -0.0633484497666359, -0.05946251377463341, -0.05557657778263092, -0.051690638065338135, -0.04780470207333565, -0.04391876608133316, -0.04003283381462097, -0.036146894097328186, -0.032260961830616, -0.02837502583861351, -0.024489089846611023, -0.020603153854608536, -0.01671721786260605, -0.012831282801926136, -0.008945347741246223, -0.005059411749243736, -0.001173475757241249, 0.002712458372116089, 0.006598394364118576, 0.01048433780670166, 0.014370273798704147, 0.018256209790706635, 0.022142143920063972, 0.02602807991206646, 0.029914015904068947, 0.033799950033426285, 0.03768588602542877, 0.04157182201743126, 0.045457758009433746, 0.049343694001436234, 0.05322962999343872, 0.05711556226015091, 0.061001501977443695, 0.06488743424415588, 0.06877337396144867, 0.07265930622816086, 0.07654523849487305, 0.08043117821216583, 0.08431711047887802, 0.0882030501961708, 0.092088982462883, 0.09597492218017578, 0.09986085444688797, 0.10374678671360016, 0.10763271898031235, 0.11151865869760513, 0.11540459096431732, 0.11929053068161011, 0.1231764629483223, 0.12706239521503448, 0.13094833493232727, 0.13483427464962006]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 6.0, 7.0, 15.0, 23.0, 49.0, 49.0, 73.0, 127.0, 177.0, 304.0, 471.0, 768.0, 1250.0, 1991.0, 3208.0, 5216.0, 8560.0, 14549.0, 25205.0, 45446.0, 87650.0, 199870.0, 351248.0, 145117.0, 68955.0, 36702.0, 20387.0, 12201.0, 7211.0, 4481.0, 2741.0, 1710.0, 1039.0, 645.0, 389.0, 270.0, 159.0, 94.0, 67.0, 34.0, 35.0, 19.0, 10.0, 12.0, 4.0, 4.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.249755859375, -0.24151992797851562, -0.23328399658203125, -0.22504806518554688, -0.2168121337890625, -0.20857620239257812, -0.20034027099609375, -0.19210433959960938, -0.183868408203125, -0.17563247680664062, -0.16739654541015625, -0.15916061401367188, -0.1509246826171875, -0.14268875122070312, -0.13445281982421875, -0.12621688842773438, -0.11798095703125, -0.10974502563476562, -0.10150909423828125, -0.09327316284179688, -0.0850372314453125, -0.07680130004882812, -0.06856536865234375, -0.060329437255859375, -0.052093505859375, -0.043857574462890625, -0.03562164306640625, -0.027385711669921875, -0.0191497802734375, -0.010913848876953125, -0.00267791748046875, 0.005558013916015625, 0.0137939453125, 0.022029876708984375, 0.03026580810546875, 0.038501739501953125, 0.0467376708984375, 0.054973602294921875, 0.06320953369140625, 0.07144546508789062, 0.079681396484375, 0.08791732788085938, 0.09615325927734375, 0.10438919067382812, 0.1126251220703125, 0.12086105346679688, 0.12909698486328125, 0.13733291625976562, 0.14556884765625, 0.15380477905273438, 0.16204071044921875, 0.17027664184570312, 0.1785125732421875, 0.18674850463867188, 0.19498443603515625, 0.20322036743164062, 0.211456298828125, 0.21969223022460938, 0.22792816162109375, 0.23616409301757812, 0.2444000244140625, 0.2526359558105469, 0.26087188720703125, 0.2691078186035156, 0.27734375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 12.0, 12.0, 8.0, 14.0, 11.0, 21.0, 24.0, 29.0, 36.0, 34.0, 31.0, 42.0, 44.0, 35.0, 61.0, 57.0, 53.0, 36.0, 47.0, 43.0, 47.0, 46.0, 40.0, 47.0, 33.0, 21.0, 26.0, 14.0, 8.0, 9.0, 19.0, 11.0, 8.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09503173828125, -0.0915536880493164, -0.08807563781738281, -0.08459758758544922, -0.08111953735351562, -0.07764148712158203, -0.07416343688964844, -0.07068538665771484, -0.06720733642578125, -0.06372928619384766, -0.06025123596191406, -0.05677318572998047, -0.053295135498046875, -0.04981708526611328, -0.04633903503417969, -0.042860984802246094, -0.0393829345703125, -0.035904884338378906, -0.03242683410644531, -0.02894878387451172, -0.025470733642578125, -0.02199268341064453, -0.018514633178710938, -0.015036582946777344, -0.01155853271484375, -0.008080482482910156, -0.0046024322509765625, -0.0011243820190429688, 0.002353668212890625, 0.005831718444824219, 0.009309768676757812, 0.012787818908691406, 0.016265869140625, 0.019743919372558594, 0.023221969604492188, 0.02670001983642578, 0.030178070068359375, 0.03365612030029297, 0.03713417053222656, 0.040612220764160156, 0.04409027099609375, 0.047568321228027344, 0.05104637145996094, 0.05452442169189453, 0.058002471923828125, 0.06148052215576172, 0.06495857238769531, 0.0684366226196289, 0.0719146728515625, 0.0753927230834961, 0.07887077331542969, 0.08234882354736328, 0.08582687377929688, 0.08930492401123047, 0.09278297424316406, 0.09626102447509766, 0.09973907470703125, 0.10321712493896484, 0.10669517517089844, 0.11017322540283203, 0.11365127563476562, 0.11712932586669922, 0.12060737609863281, 0.1240854263305664, 0.1275634765625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 8.0, 6.0, 12.0, 18.0, 32.0, 30.0, 71.0, 112.0, 158.0, 282.0, 390.0, 624.0, 952.0, 1524.0, 2290.0, 3635.0, 5681.0, 8793.0, 13910.0, 22114.0, 36615.0, 61710.0, 111134.0, 236777.0, 257473.0, 117984.0, 64488.0, 38070.0, 23305.0, 14561.0, 9258.0, 5934.0, 3784.0, 2400.0, 1567.0, 1017.0, 667.0, 451.0, 248.0, 176.0, 88.0, 78.0, 39.0, 35.0, 18.0, 14.0, 11.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1962890625, -0.1895313262939453, -0.18277359008789062, -0.17601585388183594, -0.16925811767578125, -0.16250038146972656, -0.15574264526367188, -0.1489849090576172, -0.1422271728515625, -0.1354694366455078, -0.12871170043945312, -0.12195396423339844, -0.11519622802734375, -0.10843849182128906, -0.10168075561523438, -0.09492301940917969, -0.088165283203125, -0.08140754699707031, -0.07464981079101562, -0.06789207458496094, -0.06113433837890625, -0.05437660217285156, -0.047618865966796875, -0.04086112976074219, -0.0341033935546875, -0.027345657348632812, -0.020587921142578125, -0.013830184936523438, -0.00707244873046875, -0.0003147125244140625, 0.006443023681640625, 0.013200759887695312, 0.01995849609375, 0.026716232299804688, 0.033473968505859375, 0.04023170471191406, 0.04698944091796875, 0.05374717712402344, 0.060504913330078125, 0.06726264953613281, 0.0740203857421875, 0.08077812194824219, 0.08753585815429688, 0.09429359436035156, 0.10105133056640625, 0.10780906677246094, 0.11456680297851562, 0.12132453918457031, 0.128082275390625, 0.1348400115966797, 0.14159774780273438, 0.14835548400878906, 0.15511322021484375, 0.16187095642089844, 0.16862869262695312, 0.1753864288330078, 0.1821441650390625, 0.1889019012451172, 0.19565963745117188, 0.20241737365722656, 0.20917510986328125, 0.21593284606933594, 0.22269058227539062, 0.2294483184814453, 0.2362060546875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 11.0, 3.0, 10.0, 12.0, 16.0, 10.0, 21.0, 24.0, 17.0, 26.0, 27.0, 35.0, 52.0, 22.0, 33.0, 41.0, 41.0, 36.0, 35.0, 42.0, 37.0, 39.0, 44.0, 33.0, 42.0, 32.0, 31.0, 34.0, 28.0, 17.0, 26.0, 22.0, 21.0, 10.0, 14.0, 8.0, 10.0, 15.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.07391357421875, -0.07198572158813477, -0.07005786895751953, -0.0681300163269043, -0.06620216369628906, -0.06427431106567383, -0.062346458435058594, -0.06041860580444336, -0.058490753173828125, -0.05656290054321289, -0.054635047912597656, -0.05270719528198242, -0.05077934265136719, -0.04885149002075195, -0.04692363739013672, -0.044995784759521484, -0.04306793212890625, -0.041140079498291016, -0.03921222686767578, -0.03728437423706055, -0.03535652160644531, -0.03342866897583008, -0.031500816345214844, -0.02957296371459961, -0.027645111083984375, -0.02571725845336914, -0.023789405822753906, -0.021861553192138672, -0.019933700561523438, -0.018005847930908203, -0.01607799530029297, -0.014150142669677734, -0.0122222900390625, -0.010294437408447266, -0.008366584777832031, -0.006438732147216797, -0.0045108795166015625, -0.002583026885986328, -0.0006551742553710938, 0.0012726783752441406, 0.003200531005859375, 0.005128383636474609, 0.007056236267089844, 0.008984088897705078, 0.010911941528320312, 0.012839794158935547, 0.014767646789550781, 0.016695499420166016, 0.01862335205078125, 0.020551204681396484, 0.02247905731201172, 0.024406909942626953, 0.026334762573242188, 0.028262615203857422, 0.030190467834472656, 0.03211832046508789, 0.034046173095703125, 0.03597402572631836, 0.037901878356933594, 0.03982973098754883, 0.04175758361816406, 0.0436854362487793, 0.04561328887939453, 0.047541141510009766, 0.049468994140625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 4.0, 10.0, 13.0, 12.0, 29.0, 35.0, 41.0, 57.0, 90.0, 139.0, 160.0, 200.0, 309.0, 361.0, 488.0, 751.0, 986.0, 1449.0, 2203.0, 3369.0, 5681.0, 10892.0, 34079.0, 893741.0, 60413.0, 14293.0, 6831.0, 3905.0, 2458.0, 1636.0, 1063.0, 775.0, 504.0, 417.0, 309.0, 207.0, 174.0, 135.0, 90.0, 78.0, 51.0, 34.0, 19.0, 17.0, 14.0, 14.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0296783447265625, -0.02876901626586914, -0.02785968780517578, -0.026950359344482422, -0.026041030883789062, -0.025131702423095703, -0.024222373962402344, -0.023313045501708984, -0.022403717041015625, -0.021494388580322266, -0.020585060119628906, -0.019675731658935547, -0.018766403198242188, -0.017857074737548828, -0.01694774627685547, -0.01603841781616211, -0.01512908935546875, -0.01421976089477539, -0.013310432434082031, -0.012401103973388672, -0.011491775512695312, -0.010582447052001953, -0.009673118591308594, -0.008763790130615234, -0.007854461669921875, -0.006945133209228516, -0.006035804748535156, -0.005126476287841797, -0.0042171478271484375, -0.003307819366455078, -0.0023984909057617188, -0.0014891624450683594, -0.000579833984375, 0.0003294944763183594, 0.0012388229370117188, 0.002148151397705078, 0.0030574798583984375, 0.003966808319091797, 0.004876136779785156, 0.005785465240478516, 0.006694793701171875, 0.007604122161865234, 0.008513450622558594, 0.009422779083251953, 0.010332107543945312, 0.011241436004638672, 0.012150764465332031, 0.01306009292602539, 0.01396942138671875, 0.01487874984741211, 0.01578807830810547, 0.016697406768798828, 0.017606735229492188, 0.018516063690185547, 0.019425392150878906, 0.020334720611572266, 0.021244049072265625, 0.022153377532958984, 0.023062705993652344, 0.023972034454345703, 0.024881362915039062, 0.025790691375732422, 0.02670001983642578, 0.02760934829711914, 0.0285186767578125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 11.0, 22.0, 30.0, 40.0, 86.0, 99.0, 112.0, 133.0, 135.0, 111.0, 80.0, 56.0, 36.0, 17.0, 11.0, 11.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0728836059570312e-06, -1.0114163160324097e-06, -9.499490261077881e-07, -8.884817361831665e-07, -8.270144462585449e-07, -7.655471563339233e-07, -7.040798664093018e-07, -6.426125764846802e-07, -5.811452865600586e-07, -5.19677996635437e-07, -4.5821070671081543e-07, -3.9674341678619385e-07, -3.3527612686157227e-07, -2.738088369369507e-07, -2.123415470123291e-07, -1.5087425708770752e-07, -8.940696716308594e-08, -2.7939677238464355e-08, 3.3527612686157227e-08, 9.499490261077881e-08, 1.564621925354004e-07, 2.1792948246002197e-07, 2.7939677238464355e-07, 3.4086406230926514e-07, 4.023313522338867e-07, 4.637986421585083e-07, 5.252659320831299e-07, 5.867332220077515e-07, 6.48200511932373e-07, 7.096678018569946e-07, 7.711350917816162e-07, 8.326023817062378e-07, 8.940696716308594e-07, 9.55536961555481e-07, 1.0170042514801025e-06, 1.0784715414047241e-06, 1.1399388313293457e-06, 1.2014061212539673e-06, 1.2628734111785889e-06, 1.3243407011032104e-06, 1.385807991027832e-06, 1.4472752809524536e-06, 1.5087425708770752e-06, 1.5702098608016968e-06, 1.6316771507263184e-06, 1.69314444065094e-06, 1.7546117305755615e-06, 1.816079020500183e-06, 1.8775463104248047e-06, 1.9390136003494263e-06, 2.000480890274048e-06, 2.0619481801986694e-06, 2.123415470123291e-06, 2.1848827600479126e-06, 2.246350049972534e-06, 2.3078173398971558e-06, 2.3692846298217773e-06, 2.430751919746399e-06, 2.4922192096710205e-06, 2.553686499595642e-06, 2.6151537895202637e-06, 2.6766210794448853e-06, 2.738088369369507e-06, 2.7995556592941284e-06, 2.86102294921875e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 7.0, 13.0, 19.0, 21.0, 46.0, 68.0, 82.0, 114.0, 206.0, 306.0, 419.0, 638.0, 953.0, 1450.0, 2255.0, 3581.0, 6390.0, 14851.0, 131326.0, 847556.0, 19264.0, 7637.0, 4060.0, 2495.0, 1563.0, 1055.0, 719.0, 482.0, 293.0, 211.0, 146.0, 101.0, 67.0, 47.0, 31.0, 26.0, 18.0, 6.0, 9.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03411865234375, -0.032985687255859375, -0.03185272216796875, -0.030719757080078125, -0.0295867919921875, -0.028453826904296875, -0.02732086181640625, -0.026187896728515625, -0.025054931640625, -0.023921966552734375, -0.02278900146484375, -0.021656036376953125, -0.0205230712890625, -0.019390106201171875, -0.01825714111328125, -0.017124176025390625, -0.0159912109375, -0.014858245849609375, -0.01372528076171875, -0.012592315673828125, -0.0114593505859375, -0.010326385498046875, -0.00919342041015625, -0.008060455322265625, -0.006927490234375, -0.005794525146484375, -0.00466156005859375, -0.003528594970703125, -0.0023956298828125, -0.001262664794921875, -0.00012969970703125, 0.001003265380859375, 0.00213623046875, 0.003269195556640625, 0.00440216064453125, 0.005535125732421875, 0.0066680908203125, 0.007801055908203125, 0.00893402099609375, 0.010066986083984375, 0.011199951171875, 0.012332916259765625, 0.01346588134765625, 0.014598846435546875, 0.0157318115234375, 0.016864776611328125, 0.01799774169921875, 0.019130706787109375, 0.020263671875, 0.021396636962890625, 0.02252960205078125, 0.023662567138671875, 0.0247955322265625, 0.025928497314453125, 0.02706146240234375, 0.028194427490234375, 0.029327392578125, 0.030460357666015625, 0.03159332275390625, 0.032726287841796875, 0.0338592529296875, 0.034992218017578125, 0.03612518310546875, 0.037258148193359375, 0.03839111328125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 12.0, 14.0, 16.0, 50.0, 545.0, 230.0, 50.0, 15.0, 8.0, 9.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00922393798828125, -0.008951544761657715, -0.00867915153503418, -0.008406758308410645, -0.00813436508178711, -0.007861971855163574, -0.007589578628540039, -0.007317185401916504, -0.007044792175292969, -0.006772398948669434, -0.0065000057220458984, -0.006227612495422363, -0.005955219268798828, -0.005682826042175293, -0.005410432815551758, -0.005138039588928223, -0.0048656463623046875, -0.004593253135681152, -0.004320859909057617, -0.004048466682434082, -0.003776073455810547, -0.0035036802291870117, -0.0032312870025634766, -0.0029588937759399414, -0.0026865005493164062, -0.002414107322692871, -0.002141714096069336, -0.0018693208694458008, -0.0015969276428222656, -0.0013245344161987305, -0.0010521411895751953, -0.0007797479629516602, -0.000507354736328125, -0.00023496150970458984, 3.743171691894531e-05, 0.00030982494354248047, 0.0005822181701660156, 0.0008546113967895508, 0.001127004623413086, 0.001399397850036621, 0.0016717910766601562, 0.0019441843032836914, 0.0022165775299072266, 0.0024889707565307617, 0.002761363983154297, 0.003033757209777832, 0.003306150436401367, 0.0035785436630249023, 0.0038509368896484375, 0.004123330116271973, 0.004395723342895508, 0.004668116569519043, 0.004940509796142578, 0.005212903022766113, 0.0054852962493896484, 0.005757689476013184, 0.006030082702636719, 0.006302475929260254, 0.006574869155883789, 0.006847262382507324, 0.007119655609130859, 0.0073920488357543945, 0.00766444206237793, 0.007936835289001465, 0.008209228515625]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 12.0, 10.0, 13.0, 20.0, 22.0, 37.0, 44.0, 43.0, 57.0, 93.0, 111.0, 117.0, 91.0, 66.0, 55.0, 39.0, 29.0, 26.0, 20.0, 21.0, 9.0, 13.0, 6.0, 8.0, 7.0, 4.0, 2.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1380511373281479, -0.13332794606685638, -0.12860475480556488, -0.12388155609369278, -0.11915835738182068, -0.11443516612052917, -0.10971197485923767, -0.10498878359794617, -0.10026558488607407, -0.09554239362478256, -0.09081919491291046, -0.08609600365161896, -0.08137281239032745, -0.07664961367845535, -0.07192642241716385, -0.06720322370529175, -0.062480032444000244, -0.05775683745741844, -0.05303364247083664, -0.048310451209545135, -0.04358725622296333, -0.03886406123638153, -0.03414086997509003, -0.029417674988508224, -0.024694480001926422, -0.01997128501534462, -0.015248091891407967, -0.010524897836148739, -0.005801703780889511, -0.0010785087943077087, 0.0036446843296289444, 0.008367877453565598, 0.0130910724401474, 0.017814267426729202, 0.022537460550665855, 0.02726065367460251, 0.03198384866118431, 0.03670704364776611, 0.04143023490905762, 0.04615342989563942, 0.05087662488222122, 0.055599819868803024, 0.06032301485538483, 0.06504620611667633, 0.06976939737796783, 0.07449259608983994, 0.07921578735113144, 0.08393898606300354, 0.08866217732429504, 0.09338536858558655, 0.09810856729745865, 0.10283175855875015, 0.10755495727062225, 0.11227814853191376, 0.11700133979320526, 0.12172453105449677, 0.12644773721694946, 0.13117092847824097, 0.13589411973953247, 0.14061732590198517, 0.14534051716327667, 0.15006370842456818, 0.15478689968585968, 0.15951009094715118, 0.1642332822084427]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 9.0, 11.0, 8.0, 11.0, 15.0, 17.0, 23.0, 23.0, 32.0, 31.0, 24.0, 36.0, 42.0, 45.0, 61.0, 44.0, 52.0, 43.0, 33.0, 48.0, 41.0, 58.0, 42.0, 35.0, 38.0, 33.0, 31.0, 19.0, 22.0, 16.0, 22.0, 10.0, 10.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09458854049444199, -0.09098723530769348, -0.08738593757152557, -0.08378463238477707, -0.08018332719802856, -0.07658202946186066, -0.07298072427511215, -0.06937941908836365, -0.06577812135219574, -0.062176819890737534, -0.05857551842927933, -0.05497421324253082, -0.05137291178107262, -0.04777161031961441, -0.044170305132865906, -0.0405690036714077, -0.03696770220994949, -0.03336640074849129, -0.029765097424387932, -0.026163794100284576, -0.02256249263882637, -0.018961191177368164, -0.015359887853264809, -0.011758584529161453, -0.008157283067703247, -0.004555980674922466, -0.0009546782821416855, 0.0026466241106390953, 0.006247926503419876, 0.009849227964878082, 0.013450531288981438, 0.017051834613084793, 0.020653143525123596, 0.024254444986581802, 0.027855748310685158, 0.03145705163478851, 0.03505835309624672, 0.038659654557704926, 0.04226095974445343, 0.045862261205911636, 0.04946356266736984, 0.05306486412882805, 0.056666165590286255, 0.06026747077703476, 0.06386877596378326, 0.06747007369995117, 0.07107137888669968, 0.07467268407344818, 0.07827398180961609, 0.0818752869963646, 0.0854765847325325, 0.089077889919281, 0.09267918765544891, 0.09628049284219742, 0.09988179802894592, 0.10348309576511383, 0.10708440095186234, 0.11068570613861084, 0.11428700387477875, 0.11788830906152725, 0.12148961424827576, 0.12509091198444366, 0.12869220972061157, 0.13229352235794067, 0.13589482009410858]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 8.0, 10.0, 19.0, 31.0, 46.0, 64.0, 99.0, 117.0, 220.0, 283.0, 414.0, 635.0, 966.0, 1294.0, 1845.0, 2832.0, 4246.0, 6558.0, 10360.0, 16469.0, 28152.0, 50503.0, 100449.0, 232974.0, 961601.0, 1968558.0, 476034.0, 157268.0, 73390.0, 38818.0, 22452.0, 13431.0, 8341.0, 5264.0, 3423.0, 2213.0, 1533.0, 1044.0, 713.0, 481.0, 347.0, 223.0, 159.0, 94.0, 78.0, 45.0, 50.0, 28.0, 17.0, 10.0, 23.0, 15.0, 13.0, 7.0, 10.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.1318359375, -0.12700271606445312, -0.12216949462890625, -0.11733627319335938, -0.1125030517578125, -0.10766983032226562, -0.10283660888671875, -0.09800338745117188, -0.093170166015625, -0.08833694458007812, -0.08350372314453125, -0.07867050170898438, -0.0738372802734375, -0.06900405883789062, -0.06417083740234375, -0.059337615966796875, -0.05450439453125, -0.049671173095703125, -0.04483795166015625, -0.040004730224609375, -0.0351715087890625, -0.030338287353515625, -0.02550506591796875, -0.020671844482421875, -0.015838623046875, -0.011005401611328125, -0.00617218017578125, -0.001338958740234375, 0.0034942626953125, 0.008327484130859375, 0.01316070556640625, 0.017993927001953125, 0.0228271484375, 0.027660369873046875, 0.03249359130859375, 0.037326812744140625, 0.0421600341796875, 0.046993255615234375, 0.05182647705078125, 0.056659698486328125, 0.061492919921875, 0.06632614135742188, 0.07115936279296875, 0.07599258422851562, 0.0808258056640625, 0.08565902709960938, 0.09049224853515625, 0.09532546997070312, 0.10015869140625, 0.10499191284179688, 0.10982513427734375, 0.11465835571289062, 0.1194915771484375, 0.12432479858398438, 0.12915802001953125, 0.13399124145507812, 0.138824462890625, 0.14365768432617188, 0.14849090576171875, 0.15332412719726562, 0.1581573486328125, 0.16299057006835938, 0.16782379150390625, 0.17265701293945312, 0.177490234375]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 8.0, 15.0, 10.0, 18.0, 24.0, 21.0, 21.0, 32.0, 28.0, 40.0, 46.0, 54.0, 61.0, 50.0, 45.0, 62.0, 44.0, 49.0, 55.0, 59.0, 34.0, 32.0, 37.0, 31.0, 21.0, 22.0, 17.0, 14.0, 19.0, 11.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06268310546875, -0.06036567687988281, -0.058048248291015625, -0.05573081970214844, -0.05341339111328125, -0.05109596252441406, -0.048778533935546875, -0.04646110534667969, -0.0441436767578125, -0.04182624816894531, -0.039508819580078125, -0.03719139099121094, -0.03487396240234375, -0.03255653381347656, -0.030239105224609375, -0.027921676635742188, -0.025604248046875, -0.023286819458007812, -0.020969390869140625, -0.018651962280273438, -0.01633453369140625, -0.014017105102539062, -0.011699676513671875, -0.009382247924804688, -0.0070648193359375, -0.0047473907470703125, -0.002429962158203125, -0.0001125335693359375, 0.00220489501953125, 0.0045223236083984375, 0.006839752197265625, 0.009157180786132812, 0.011474609375, 0.013792037963867188, 0.016109466552734375, 0.018426895141601562, 0.02074432373046875, 0.023061752319335938, 0.025379180908203125, 0.027696609497070312, 0.0300140380859375, 0.03233146667480469, 0.034648895263671875, 0.03696632385253906, 0.03928375244140625, 0.04160118103027344, 0.043918609619140625, 0.04623603820800781, 0.048553466796875, 0.05087089538574219, 0.053188323974609375, 0.05550575256347656, 0.05782318115234375, 0.06014060974121094, 0.062458038330078125, 0.06477546691894531, 0.0670928955078125, 0.06941032409667969, 0.07172775268554688, 0.07404518127441406, 0.07636260986328125, 0.07868003845214844, 0.08099746704101562, 0.08331489562988281, 0.08563232421875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 9.0, 7.0, 7.0, 14.0, 32.0, 38.0, 46.0, 82.0, 78.0, 157.0, 213.0, 319.0, 469.0, 674.0, 945.0, 1401.0, 2062.0, 3207.0, 4919.0, 7559.0, 12019.0, 20197.0, 34375.0, 62516.0, 120583.0, 253349.0, 642844.0, 1758697.0, 708388.0, 272538.0, 127618.0, 66476.0, 36053.0, 20717.0, 12698.0, 7861.0, 5097.0, 3172.0, 2133.0, 1555.0, 972.0, 628.0, 466.0, 318.0, 214.0, 181.0, 131.0, 79.0, 49.0, 35.0, 31.0, 22.0, 12.0, 11.0, 11.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1068115234375, -0.10331439971923828, -0.09981727600097656, -0.09632015228271484, -0.09282302856445312, -0.0893259048461914, -0.08582878112792969, -0.08233165740966797, -0.07883453369140625, -0.07533740997314453, -0.07184028625488281, -0.0683431625366211, -0.06484603881835938, -0.061348915100097656, -0.05785179138183594, -0.05435466766357422, -0.0508575439453125, -0.04736042022705078, -0.04386329650878906, -0.040366172790527344, -0.036869049072265625, -0.033371925354003906, -0.029874801635742188, -0.02637767791748047, -0.02288055419921875, -0.01938343048095703, -0.015886306762695312, -0.012389183044433594, -0.008892059326171875, -0.005394935607910156, -0.0018978118896484375, 0.0015993118286132812, 0.005096435546875, 0.008593559265136719, 0.012090682983398438, 0.015587806701660156, 0.019084930419921875, 0.022582054138183594, 0.026079177856445312, 0.02957630157470703, 0.03307342529296875, 0.03657054901123047, 0.04006767272949219, 0.043564796447753906, 0.047061920166015625, 0.050559043884277344, 0.05405616760253906, 0.05755329132080078, 0.0610504150390625, 0.06454753875732422, 0.06804466247558594, 0.07154178619384766, 0.07503890991210938, 0.0785360336303711, 0.08203315734863281, 0.08553028106689453, 0.08902740478515625, 0.09252452850341797, 0.09602165222167969, 0.0995187759399414, 0.10301589965820312, 0.10651302337646484, 0.11001014709472656, 0.11350727081298828, 0.11700439453125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 7.0, 5.0, 6.0, 5.0, 10.0, 9.0, 8.0, 19.0, 18.0, 31.0, 42.0, 32.0, 37.0, 47.0, 56.0, 74.0, 95.0, 103.0, 143.0, 174.0, 173.0, 246.0, 255.0, 253.0, 326.0, 323.0, 256.0, 205.0, 186.0, 147.0, 132.0, 113.0, 100.0, 80.0, 65.0, 51.0, 36.0, 39.0, 40.0, 22.0, 24.0, 14.0, 11.0, 7.0, 14.0, 8.0, 10.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0], "bins": [-0.030853271484375, -0.029905080795288086, -0.028956890106201172, -0.028008699417114258, -0.027060508728027344, -0.02611231803894043, -0.025164127349853516, -0.0242159366607666, -0.023267745971679688, -0.022319555282592773, -0.02137136459350586, -0.020423173904418945, -0.01947498321533203, -0.018526792526245117, -0.017578601837158203, -0.01663041114807129, -0.015682220458984375, -0.014734029769897461, -0.013785839080810547, -0.012837648391723633, -0.011889457702636719, -0.010941267013549805, -0.00999307632446289, -0.009044885635375977, -0.008096694946289062, -0.0071485042572021484, -0.006200313568115234, -0.00525212287902832, -0.004303932189941406, -0.003355741500854492, -0.002407550811767578, -0.001459360122680664, -0.00051116943359375, 0.00043702125549316406, 0.0013852119445800781, 0.002333402633666992, 0.0032815933227539062, 0.00422978401184082, 0.005177974700927734, 0.0061261653900146484, 0.0070743560791015625, 0.008022546768188477, 0.00897073745727539, 0.009918928146362305, 0.010867118835449219, 0.011815309524536133, 0.012763500213623047, 0.013711690902709961, 0.014659881591796875, 0.015608072280883789, 0.016556262969970703, 0.017504453659057617, 0.01845264434814453, 0.019400835037231445, 0.02034902572631836, 0.021297216415405273, 0.022245407104492188, 0.0231935977935791, 0.024141788482666016, 0.02508997917175293, 0.026038169860839844, 0.026986360549926758, 0.027934551239013672, 0.028882741928100586, 0.0298309326171875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 7.0, 8.0, 6.0, 19.0, 16.0, 14.0, 16.0, 41.0, 28.0, 41.0, 72.0, 73.0, 106.0, 113.0, 85.0, 78.0, 62.0, 36.0, 31.0, 26.0, 19.0, 21.0, 16.0, 15.0, 8.0, 15.0, 2.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.09816417843103409, -0.0953189954161644, -0.09247381240129471, -0.08962863683700562, -0.08678345382213593, -0.08393827080726624, -0.08109308779239655, -0.07824790477752686, -0.07540272176265717, -0.07255753874778748, -0.06971235573291779, -0.0668671727180481, -0.064021997153759, -0.06117681413888931, -0.05833163112401962, -0.05548644810914993, -0.05264127254486084, -0.04979608952999115, -0.04695091024041176, -0.04410572722554207, -0.04126054793596268, -0.03841536492109299, -0.0355701819062233, -0.03272499889135361, -0.029879819601774216, -0.027034638449549675, -0.024189457297325134, -0.021344274282455444, -0.018499093130230904, -0.015653911978006363, -0.012808728963136673, -0.009963547810912132, -0.007118359208106995, -0.004273177590221167, -0.0014279959723353386, 0.0014171861112117767, 0.0042623672634363174, 0.007107548415660858, 0.009952731430530548, 0.012797912582755089, 0.01564309373497963, 0.01848827488720417, 0.02133345603942871, 0.0241786390542984, 0.02702382020652294, 0.029869001358747482, 0.03271418437361717, 0.035559363663196564, 0.038404546678066254, 0.041249729692935944, 0.044094908982515335, 0.046940091997385025, 0.049785271286964417, 0.052630454301834106, 0.055475637316703796, 0.058320820331573486, 0.06116599962115288, 0.06401117891073227, 0.06685636192560196, 0.06970154494047165, 0.07254672795534134, 0.07539190351963043, 0.07823708653450012, 0.08108226954936981, 0.0839274525642395]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 3.0, 5.0, 6.0, 7.0, 11.0, 10.0, 12.0, 18.0, 18.0, 23.0, 31.0, 32.0, 37.0, 42.0, 40.0, 34.0, 33.0, 49.0, 54.0, 42.0, 57.0, 45.0, 36.0, 52.0, 42.0, 52.0, 32.0, 28.0, 33.0, 17.0, 18.0, 15.0, 17.0, 10.0, 12.0, 10.0, 7.0, 10.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06254863739013672, -0.06028264760971069, -0.05801665410399437, -0.055750660598278046, -0.05348467081785202, -0.051218681037425995, -0.04895268753170967, -0.04668669402599335, -0.04442070424556732, -0.042154714465141296, -0.03988872095942497, -0.03762272745370865, -0.03535673767328262, -0.0330907478928566, -0.030824754387140274, -0.0285587627440691, -0.026292771100997925, -0.02402677945792675, -0.021760787814855576, -0.0194947961717844, -0.017228804528713226, -0.014962812885642052, -0.012696821242570877, -0.010430829599499702, -0.008164837956428528, -0.005898846313357353, -0.0036328546702861786, -0.001366863027215004, 0.0008991286158561707, 0.0031651202589273453, 0.00543111190199852, 0.0076971035450696945, 0.009963102638721466, 0.01222909428179264, 0.014495085924863815, 0.01676107756793499, 0.019027069211006165, 0.02129306085407734, 0.023559052497148514, 0.02582504414021969, 0.028091035783290863, 0.030357027426362038, 0.03262301906943321, 0.034889012575149536, 0.03715500235557556, 0.03942099213600159, 0.04168698564171791, 0.043952979147434235, 0.04621896892786026, 0.048484958708286285, 0.05075095221400261, 0.05301694571971893, 0.05528293550014496, 0.057548925280570984, 0.05981491878628731, 0.06208091229200363, 0.06434690207242966, 0.06661289185285568, 0.0688788890838623, 0.07114487886428833, 0.07341086864471436, 0.07567685842514038, 0.0779428482055664, 0.08020884543657303, 0.08247483521699905]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 10.0, 14.0, 20.0, 23.0, 37.0, 51.0, 104.0, 155.0, 235.0, 366.0, 577.0, 892.0, 1492.0, 2294.0, 4053.0, 6626.0, 11185.0, 19974.0, 36891.0, 72892.0, 175878.0, 397215.0, 165773.0, 69928.0, 35237.0, 19117.0, 10921.0, 6416.0, 3871.0, 2338.0, 1458.0, 931.0, 571.0, 337.0, 209.0, 162.0, 95.0, 74.0, 46.0, 29.0, 19.0, 12.0, 6.0, 7.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0284576416015625, -0.027655363082885742, -0.026853084564208984, -0.026050806045532227, -0.02524852752685547, -0.02444624900817871, -0.023643970489501953, -0.022841691970825195, -0.022039413452148438, -0.02123713493347168, -0.020434856414794922, -0.019632577896118164, -0.018830299377441406, -0.01802802085876465, -0.01722574234008789, -0.016423463821411133, -0.015621185302734375, -0.014818906784057617, -0.01401662826538086, -0.013214349746704102, -0.012412071228027344, -0.011609792709350586, -0.010807514190673828, -0.01000523567199707, -0.009202957153320312, -0.008400678634643555, -0.007598400115966797, -0.006796121597290039, -0.005993843078613281, -0.0051915645599365234, -0.004389286041259766, -0.003587007522583008, -0.00278472900390625, -0.001982450485229492, -0.0011801719665527344, -0.00037789344787597656, 0.00042438507080078125, 0.001226663589477539, 0.002028942108154297, 0.0028312206268310547, 0.0036334991455078125, 0.00443577766418457, 0.005238056182861328, 0.006040334701538086, 0.006842613220214844, 0.0076448917388916016, 0.00844717025756836, 0.009249448776245117, 0.010051727294921875, 0.010854005813598633, 0.01165628433227539, 0.012458562850952148, 0.013260841369628906, 0.014063119888305664, 0.014865398406982422, 0.01566767692565918, 0.016469955444335938, 0.017272233963012695, 0.018074512481689453, 0.01887679100036621, 0.01967906951904297, 0.020481348037719727, 0.021283626556396484, 0.022085905075073242, 0.02288818359375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 3.0, 14.0, 14.0, 10.0, 18.0, 27.0, 24.0, 35.0, 28.0, 38.0, 37.0, 29.0, 34.0, 52.0, 62.0, 51.0, 51.0, 65.0, 46.0, 51.0, 50.0, 45.0, 38.0, 28.0, 27.0, 15.0, 14.0, 22.0, 14.0, 10.0, 10.0, 5.0, 6.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0689697265625, -0.06649112701416016, -0.06401252746582031, -0.06153392791748047, -0.059055328369140625, -0.05657672882080078, -0.05409812927246094, -0.051619529724121094, -0.04914093017578125, -0.046662330627441406, -0.04418373107910156, -0.04170513153076172, -0.039226531982421875, -0.03674793243408203, -0.03426933288574219, -0.031790733337402344, -0.0293121337890625, -0.026833534240722656, -0.024354934692382812, -0.02187633514404297, -0.019397735595703125, -0.01691913604736328, -0.014440536499023438, -0.011961936950683594, -0.00948333740234375, -0.007004737854003906, -0.0045261383056640625, -0.0020475387573242188, 0.000431060791015625, 0.0029096603393554688, 0.0053882598876953125, 0.007866859436035156, 0.010345458984375, 0.012824058532714844, 0.015302658081054688, 0.01778125762939453, 0.020259857177734375, 0.02273845672607422, 0.025217056274414062, 0.027695655822753906, 0.03017425537109375, 0.032652854919433594, 0.03513145446777344, 0.03761005401611328, 0.040088653564453125, 0.04256725311279297, 0.04504585266113281, 0.047524452209472656, 0.0500030517578125, 0.052481651306152344, 0.05496025085449219, 0.05743885040283203, 0.059917449951171875, 0.06239604949951172, 0.06487464904785156, 0.0673532485961914, 0.06983184814453125, 0.0723104476928711, 0.07478904724121094, 0.07726764678955078, 0.07974624633789062, 0.08222484588623047, 0.08470344543457031, 0.08718204498291016, 0.08966064453125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 4.0, 3.0, 7.0, 12.0, 16.0, 8.0, 19.0, 35.0, 31.0, 73.0, 69.0, 116.0, 151.0, 228.0, 297.0, 449.0, 622.0, 1003.0, 1511.0, 2461.0, 3898.0, 6017.0, 10242.0, 17517.0, 32462.0, 65809.0, 163455.0, 434173.0, 163802.0, 66470.0, 32382.0, 17899.0, 10246.0, 6195.0, 3726.0, 2379.0, 1591.0, 1001.0, 683.0, 471.0, 314.0, 218.0, 167.0, 84.0, 74.0, 61.0, 26.0, 20.0, 17.0, 20.0, 12.0, 3.0, 8.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0289764404296875, -0.028056621551513672, -0.027136802673339844, -0.026216983795166016, -0.025297164916992188, -0.02437734603881836, -0.02345752716064453, -0.022537708282470703, -0.021617889404296875, -0.020698070526123047, -0.01977825164794922, -0.01885843276977539, -0.017938613891601562, -0.017018795013427734, -0.016098976135253906, -0.015179157257080078, -0.01425933837890625, -0.013339519500732422, -0.012419700622558594, -0.011499881744384766, -0.010580062866210938, -0.00966024398803711, -0.008740425109863281, -0.007820606231689453, -0.006900787353515625, -0.005980968475341797, -0.005061149597167969, -0.004141330718994141, -0.0032215118408203125, -0.0023016929626464844, -0.0013818740844726562, -0.0004620552062988281, 0.000457763671875, 0.0013775825500488281, 0.0022974014282226562, 0.0032172203063964844, 0.0041370391845703125, 0.005056858062744141, 0.005976676940917969, 0.006896495819091797, 0.007816314697265625, 0.008736133575439453, 0.009655952453613281, 0.01057577133178711, 0.011495590209960938, 0.012415409088134766, 0.013335227966308594, 0.014255046844482422, 0.01517486572265625, 0.016094684600830078, 0.017014503479003906, 0.017934322357177734, 0.018854141235351562, 0.01977396011352539, 0.02069377899169922, 0.021613597869873047, 0.022533416748046875, 0.023453235626220703, 0.02437305450439453, 0.02529287338256836, 0.026212692260742188, 0.027132511138916016, 0.028052330017089844, 0.028972148895263672, 0.0298919677734375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 12.0, 3.0, 6.0, 12.0, 12.0, 10.0, 12.0, 21.0, 15.0, 27.0, 26.0, 22.0, 28.0, 43.0, 32.0, 45.0, 31.0, 36.0, 37.0, 34.0, 38.0, 43.0, 39.0, 40.0, 42.0, 32.0, 39.0, 36.0, 36.0, 25.0, 26.0, 22.0, 21.0, 15.0, 19.0, 16.0, 11.0, 4.0, 9.0, 5.0, 5.0, 5.0, 2.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.042022705078125, -0.040728092193603516, -0.03943347930908203, -0.03813886642456055, -0.03684425354003906, -0.03554964065551758, -0.034255027770996094, -0.03296041488647461, -0.031665802001953125, -0.03037118911743164, -0.029076576232910156, -0.027781963348388672, -0.026487350463867188, -0.025192737579345703, -0.02389812469482422, -0.022603511810302734, -0.02130889892578125, -0.020014286041259766, -0.01871967315673828, -0.017425060272216797, -0.016130447387695312, -0.014835834503173828, -0.013541221618652344, -0.01224660873413086, -0.010951995849609375, -0.00965738296508789, -0.008362770080566406, -0.007068157196044922, -0.0057735443115234375, -0.004478931427001953, -0.0031843185424804688, -0.0018897056579589844, -0.0005950927734375, 0.0006995201110839844, 0.0019941329956054688, 0.003288745880126953, 0.0045833587646484375, 0.005877971649169922, 0.007172584533691406, 0.00846719741821289, 0.009761810302734375, 0.01105642318725586, 0.012351036071777344, 0.013645648956298828, 0.014940261840820312, 0.016234874725341797, 0.01752948760986328, 0.018824100494384766, 0.02011871337890625, 0.021413326263427734, 0.02270793914794922, 0.024002552032470703, 0.025297164916992188, 0.026591777801513672, 0.027886390686035156, 0.02918100357055664, 0.030475616455078125, 0.03177022933959961, 0.033064842224121094, 0.03435945510864258, 0.03565406799316406, 0.03694868087768555, 0.03824329376220703, 0.039537906646728516, 0.04083251953125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 9.0, 9.0, 14.0, 20.0, 26.0, 37.0, 54.0, 62.0, 71.0, 127.0, 196.0, 247.0, 383.0, 522.0, 769.0, 1171.0, 1723.0, 2866.0, 4723.0, 8272.0, 15254.0, 31026.0, 76035.0, 479571.0, 297958.0, 65676.0, 27714.0, 14035.0, 7617.0, 4496.0, 2714.0, 1669.0, 1121.0, 731.0, 465.0, 316.0, 238.0, 159.0, 124.0, 89.0, 59.0, 49.0, 34.0, 28.0, 23.0, 10.0, 12.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0], "bins": [-0.0031280517578125, -0.0030384957790374756, -0.002948939800262451, -0.0028593838214874268, -0.0027698278427124023, -0.002680271863937378, -0.0025907158851623535, -0.002501159906387329, -0.0024116039276123047, -0.0023220479488372803, -0.002232491970062256, -0.0021429359912872314, -0.002053380012512207, -0.0019638240337371826, -0.0018742680549621582, -0.0017847120761871338, -0.0016951560974121094, -0.001605600118637085, -0.0015160441398620605, -0.0014264881610870361, -0.0013369321823120117, -0.0012473762035369873, -0.0011578202247619629, -0.0010682642459869385, -0.000978708267211914, -0.0008891522884368896, -0.0007995963096618652, -0.0007100403308868408, -0.0006204843521118164, -0.000530928373336792, -0.0004413723945617676, -0.00035181641578674316, -0.00026226043701171875, -0.00017270445823669434, -8.314847946166992e-05, 6.407499313354492e-06, 9.59634780883789e-05, 0.00018551945686340332, 0.00027507543563842773, 0.00036463141441345215, 0.00045418739318847656, 0.000543743371963501, 0.0006332993507385254, 0.0007228553295135498, 0.0008124113082885742, 0.0009019672870635986, 0.000991523265838623, 0.0010810792446136475, 0.0011706352233886719, 0.0012601912021636963, 0.0013497471809387207, 0.0014393031597137451, 0.0015288591384887695, 0.001618415117263794, 0.0017079710960388184, 0.0017975270748138428, 0.0018870830535888672, 0.0019766390323638916, 0.002066195011138916, 0.0021557509899139404, 0.002245306968688965, 0.0023348629474639893, 0.0024244189262390137, 0.002513974905014038, 0.0026035308837890625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 0.0, 1.0, 7.0, 13.0, 11.0, 15.0, 19.0, 29.0, 0.0, 36.0, 53.0, 56.0, 67.0, 85.0, 81.0, 82.0, 88.0, 92.0, 75.0, 44.0, 30.0, 0.0, 35.0, 25.0, 19.0, 5.0, 8.0, 9.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-06, -1.7331913113594055e-06, -1.6782432794570923e-06, -1.623295247554779e-06, -1.5683472156524658e-06, -1.5133991837501526e-06, -1.4584511518478394e-06, -1.4035031199455261e-06, -1.3485550880432129e-06, -1.2936070561408997e-06, -1.2386590242385864e-06, -1.1837109923362732e-06, -1.12876296043396e-06, -1.0738149285316467e-06, -1.0188668966293335e-06, -9.639188647270203e-07, -9.08970832824707e-07, -8.540228009223938e-07, -7.990747690200806e-07, -7.441267371177673e-07, -6.891787052154541e-07, -6.342306733131409e-07, -5.792826414108276e-07, -5.243346095085144e-07, -4.6938657760620117e-07, -4.1443854570388794e-07, -3.594905138015747e-07, -3.045424818992615e-07, -2.4959444999694824e-07, -1.94646418094635e-07, -1.3969838619232178e-07, -8.475035429000854e-08, -2.9802322387695312e-08, 2.514570951461792e-08, 8.009374141693115e-08, 1.3504177331924438e-07, 1.8998980522155762e-07, 2.4493783712387085e-07, 2.998858690261841e-07, 3.548339009284973e-07, 4.0978193283081055e-07, 4.647299647331238e-07, 5.19677996635437e-07, 5.746260285377502e-07, 6.295740604400635e-07, 6.845220923423767e-07, 7.394701242446899e-07, 7.944181561470032e-07, 8.493661880493164e-07, 9.043142199516296e-07, 9.592622518539429e-07, 1.014210283756256e-06, 1.0691583156585693e-06, 1.1241063475608826e-06, 1.1790543794631958e-06, 1.234002411365509e-06, 1.2889504432678223e-06, 1.3438984751701355e-06, 1.3988465070724487e-06, 1.453794538974762e-06, 1.5087425708770752e-06, 1.5636906027793884e-06, 1.6186386346817017e-06, 1.6735866665840149e-06, 1.7285346984863281e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 10.0, 12.0, 13.0, 25.0, 41.0, 38.0, 77.0, 90.0, 134.0, 195.0, 303.0, 426.0, 664.0, 1019.0, 1564.0, 2642.0, 4303.0, 7314.0, 13206.0, 25582.0, 57117.0, 174486.0, 552174.0, 115996.0, 43536.0, 20578.0, 10955.0, 6126.0, 3658.0, 2226.0, 1392.0, 837.0, 553.0, 400.0, 272.0, 167.0, 119.0, 90.0, 58.0, 43.0, 27.0, 25.0, 13.0, 20.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.00354766845703125, -0.0034412741661071777, -0.0033348798751831055, -0.003228485584259033, -0.003122091293334961, -0.0030156970024108887, -0.0029093027114868164, -0.002802908420562744, -0.002696514129638672, -0.0025901198387145996, -0.0024837255477905273, -0.002377331256866455, -0.002270936965942383, -0.0021645426750183105, -0.0020581483840942383, -0.001951754093170166, -0.0018453598022460938, -0.0017389655113220215, -0.0016325712203979492, -0.001526176929473877, -0.0014197826385498047, -0.0013133883476257324, -0.0012069940567016602, -0.0011005997657775879, -0.0009942054748535156, -0.0008878111839294434, -0.0007814168930053711, -0.0006750226020812988, -0.0005686283111572266, -0.0004622340202331543, -0.00035583972930908203, -0.00024944543838500977, -0.0001430511474609375, -3.6656856536865234e-05, 6.973743438720703e-05, 0.0001761317253112793, 0.00028252601623535156, 0.00038892030715942383, 0.0004953145980834961, 0.0006017088890075684, 0.0007081031799316406, 0.0008144974708557129, 0.0009208917617797852, 0.0010272860527038574, 0.0011336803436279297, 0.001240074634552002, 0.0013464689254760742, 0.0014528632164001465, 0.0015592575073242188, 0.001665651798248291, 0.0017720460891723633, 0.0018784403800964355, 0.001984834671020508, 0.00209122896194458, 0.0021976232528686523, 0.0023040175437927246, 0.002410411834716797, 0.002516806125640869, 0.0026232004165649414, 0.0027295947074890137, 0.002835988998413086, 0.002942383289337158, 0.0030487775802612305, 0.0031551718711853027, 0.003261566162109375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 10.0, 4.0, 8.0, 10.0, 10.0, 5.0, 11.0, 22.0, 27.0, 19.0, 33.0, 45.0, 54.0, 88.0, 109.0, 137.0, 116.0, 69.0, 38.0, 33.0, 23.0, 24.0, 16.0, 15.0, 15.0, 7.0, 5.0, 9.0, 7.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008630752563476562, -0.0008345544338226318, -0.0008060336112976074, -0.000777512788772583, -0.0007489919662475586, -0.0007204711437225342, -0.0006919503211975098, -0.0006634294986724854, -0.0006349086761474609, -0.0006063878536224365, -0.0005778670310974121, -0.0005493462085723877, -0.0005208253860473633, -0.0004923045635223389, -0.00046378374099731445, -0.00043526291847229004, -0.0004067420959472656, -0.0003782212734222412, -0.0003497004508972168, -0.0003211796283721924, -0.00029265880584716797, -0.00026413798332214355, -0.00023561716079711914, -0.00020709633827209473, -0.0001785755157470703, -0.0001500546932220459, -0.00012153387069702148, -9.301304817199707e-05, -6.449222564697266e-05, -3.597140312194824e-05, -7.450580596923828e-06, 2.1070241928100586e-05, 4.9591064453125e-05, 7.811188697814941e-05, 0.00010663270950317383, 0.00013515353202819824, 0.00016367435455322266, 0.00019219517707824707, 0.00022071599960327148, 0.0002492368221282959, 0.0002777576446533203, 0.0003062784671783447, 0.00033479928970336914, 0.00036332011222839355, 0.00039184093475341797, 0.0004203617572784424, 0.0004488825798034668, 0.0004774034023284912, 0.0005059242248535156, 0.00053444504737854, 0.0005629658699035645, 0.0005914866924285889, 0.0006200075149536133, 0.0006485283374786377, 0.0006770491600036621, 0.0007055699825286865, 0.0007340908050537109, 0.0007626116275787354, 0.0007911324501037598, 0.0008196532726287842, 0.0008481740951538086, 0.000876694917678833, 0.0009052157402038574, 0.0009337365627288818, 0.0009622573852539062]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 12.0, 15.0, 18.0, 17.0, 31.0, 39.0, 44.0, 68.0, 85.0, 108.0, 112.0, 81.0, 80.0, 63.0, 34.0, 25.0, 29.0, 16.0, 21.0, 15.0, 11.0, 17.0, 8.0, 3.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.09977977722883224, -0.096879743039608, -0.09397970139980316, -0.09107966721057892, -0.08817963302135468, -0.08527959138154984, -0.08237955719232559, -0.07947951555252075, -0.07657948136329651, -0.07367944717407227, -0.07077940553426743, -0.06787937134504318, -0.06497932970523834, -0.0620792955160141, -0.059179261326789856, -0.056279223412275314, -0.05337918549776077, -0.05047914758324623, -0.04757910966873169, -0.044679075479507446, -0.041779037564992905, -0.03887899965047836, -0.03597896546125412, -0.03307892754673958, -0.030178889632225037, -0.027278851717710495, -0.024378815665841103, -0.02147877961397171, -0.01857874169945717, -0.015678703784942627, -0.012778667733073235, -0.009878631681203842, -0.006978586316108704, -0.004078549332916737, -0.0011785123497247696, 0.0017215246334671974, 0.004621561616659164, 0.0075215985998511314, 0.010421635583043098, 0.01332167163491249, 0.016221709549427032, 0.019121747463941574, 0.022021783515810966, 0.02492181956768036, 0.0278218574821949, 0.030721895396709442, 0.033621929585933685, 0.03652196750044823, 0.03942200541496277, 0.04232204332947731, 0.04522208124399185, 0.048122115433216095, 0.05102215334773064, 0.05392219126224518, 0.05682222545146942, 0.05972226336598396, 0.0626223012804985, 0.06552233546972275, 0.06842237710952759, 0.07132241129875183, 0.07422244548797607, 0.07712248712778091, 0.08002252131700516, 0.08292256295681, 0.08582259714603424]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 0.0, 3.0, 5.0, 6.0, 8.0, 10.0, 10.0, 11.0, 19.0, 17.0, 21.0, 28.0, 35.0, 38.0, 41.0, 39.0, 35.0, 31.0, 46.0, 59.0, 43.0, 54.0, 45.0, 36.0, 52.0, 43.0, 55.0, 29.0, 29.0, 34.0, 18.0, 17.0, 18.0, 16.0, 10.0, 11.0, 12.0, 6.0, 9.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06261952221393585, -0.060358162969350815, -0.05809680372476578, -0.05583544820547104, -0.053574088960886, -0.051312729716300964, -0.049051374197006226, -0.04679001495242119, -0.04452865570783615, -0.042267296463251114, -0.04000593721866608, -0.03774458169937134, -0.0354832224547863, -0.03322186321020126, -0.030960505828261375, -0.028699148446321487, -0.02643778920173645, -0.024176429957151413, -0.021915072575211525, -0.019653715193271637, -0.0173923559486866, -0.015130997635424137, -0.012869639322161674, -0.010608281940221786, -0.00834692269563675, -0.006085564382374287, -0.003824206069111824, -0.0015628477558493614, 0.0006985105574131012, 0.002959868870675564, 0.005221227183938026, 0.007482584565877914, 0.009743936359882355, 0.012005294673144817, 0.01426665298640728, 0.016528010368347168, 0.018789369612932205, 0.021050728857517242, 0.02331208623945713, 0.02557344362139702, 0.027834802865982056, 0.030096162110567093, 0.03235752135515213, 0.03461887687444687, 0.036880236119031906, 0.03914159536361694, 0.04140295088291168, 0.04366431012749672, 0.04592566937208176, 0.048187028616666794, 0.05044838786125183, 0.05270974338054657, 0.05497110262513161, 0.057232461869716644, 0.05949381738901138, 0.06175517663359642, 0.06401653587818146, 0.0662778913974762, 0.06853925436735153, 0.07080060988664627, 0.0730619728565216, 0.07532332837581635, 0.07758468389511108, 0.07984603941440582, 0.08210740238428116]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 10.0, 13.0, 18.0, 29.0, 54.0, 94.0, 116.0, 200.0, 291.0, 468.0, 712.0, 1131.0, 1794.0, 2828.0, 4513.0, 7481.0, 12280.0, 21253.0, 36814.0, 68490.0, 143932.0, 337373.0, 207498.0, 89141.0, 46923.0, 26059.0, 15268.0, 9012.0, 5437.0, 3392.0, 2143.0, 1380.0, 845.0, 574.0, 324.0, 230.0, 144.0, 96.0, 53.0, 46.0, 32.0, 15.0, 18.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1407470703125, -0.13600730895996094, -0.13126754760742188, -0.1265277862548828, -0.12178802490234375, -0.11704826354980469, -0.11230850219726562, -0.10756874084472656, -0.1028289794921875, -0.09808921813964844, -0.09334945678710938, -0.08860969543457031, -0.08386993408203125, -0.07913017272949219, -0.07439041137695312, -0.06965065002441406, -0.064910888671875, -0.06017112731933594, -0.055431365966796875, -0.05069160461425781, -0.04595184326171875, -0.04121208190917969, -0.036472320556640625, -0.03173255920410156, -0.0269927978515625, -0.022253036499023438, -0.017513275146484375, -0.012773513793945312, -0.00803375244140625, -0.0032939910888671875, 0.001445770263671875, 0.0061855316162109375, 0.01092529296875, 0.015665054321289062, 0.020404815673828125, 0.025144577026367188, 0.02988433837890625, 0.03462409973144531, 0.039363861083984375, 0.04410362243652344, 0.0488433837890625, 0.05358314514160156, 0.058322906494140625, 0.06306266784667969, 0.06780242919921875, 0.07254219055175781, 0.07728195190429688, 0.08202171325683594, 0.086761474609375, 0.09150123596191406, 0.09624099731445312, 0.10098075866699219, 0.10572052001953125, 0.11046028137207031, 0.11520004272460938, 0.11993980407714844, 0.1246795654296875, 0.12941932678222656, 0.13415908813476562, 0.1388988494873047, 0.14363861083984375, 0.1483783721923828, 0.15311813354492188, 0.15785789489746094, 0.16259765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 9.0, 7.0, 12.0, 11.0, 17.0, 18.0, 18.0, 22.0, 35.0, 22.0, 40.0, 39.0, 42.0, 26.0, 32.0, 54.0, 49.0, 42.0, 54.0, 45.0, 47.0, 54.0, 36.0, 54.0, 30.0, 31.0, 25.0, 28.0, 16.0, 9.0, 10.0, 17.0, 11.0, 11.0, 5.0, 6.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059722900390625, -0.0577082633972168, -0.055693626403808594, -0.05367898941040039, -0.05166435241699219, -0.049649715423583984, -0.04763507843017578, -0.04562044143676758, -0.043605804443359375, -0.04159116744995117, -0.03957653045654297, -0.037561893463134766, -0.03554725646972656, -0.03353261947631836, -0.031517982482910156, -0.029503345489501953, -0.02748870849609375, -0.025474071502685547, -0.023459434509277344, -0.02144479751586914, -0.019430160522460938, -0.017415523529052734, -0.015400886535644531, -0.013386249542236328, -0.011371612548828125, -0.009356975555419922, -0.007342338562011719, -0.005327701568603516, -0.0033130645751953125, -0.0012984275817871094, 0.0007162094116210938, 0.002730846405029297, 0.0047454833984375, 0.006760120391845703, 0.008774757385253906, 0.01078939437866211, 0.012804031372070312, 0.014818668365478516, 0.01683330535888672, 0.018847942352294922, 0.020862579345703125, 0.022877216339111328, 0.02489185333251953, 0.026906490325927734, 0.028921127319335938, 0.03093576431274414, 0.032950401306152344, 0.03496503829956055, 0.03697967529296875, 0.03899431228637695, 0.041008949279785156, 0.04302358627319336, 0.04503822326660156, 0.047052860260009766, 0.04906749725341797, 0.05108213424682617, 0.053096771240234375, 0.05511140823364258, 0.05712604522705078, 0.059140682220458984, 0.06115531921386719, 0.06316995620727539, 0.0651845932006836, 0.0671992301940918, 0.0692138671875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 7.0, 13.0, 11.0, 33.0, 45.0, 51.0, 91.0, 105.0, 150.0, 223.0, 297.0, 416.0, 602.0, 857.0, 1262.0, 1863.0, 2579.0, 3772.0, 5648.0, 8507.0, 13296.0, 20611.0, 33465.0, 56840.0, 102353.0, 215231.0, 277717.0, 126009.0, 67874.0, 39535.0, 23784.0, 15015.0, 9778.0, 6495.0, 4379.0, 2984.0, 1963.0, 1370.0, 954.0, 713.0, 497.0, 361.0, 232.0, 158.0, 133.0, 76.0, 68.0, 42.0, 23.0, 23.0, 17.0, 8.0, 11.0, 2.0, 4.0, 3.0, 4.0], "bins": [-0.12060546875, -0.11696815490722656, -0.11333084106445312, -0.10969352722167969, -0.10605621337890625, -0.10241889953613281, -0.09878158569335938, -0.09514427185058594, -0.0915069580078125, -0.08786964416503906, -0.08423233032226562, -0.08059501647949219, -0.07695770263671875, -0.07332038879394531, -0.06968307495117188, -0.06604576110839844, -0.062408447265625, -0.05877113342285156, -0.055133819580078125, -0.05149650573730469, -0.04785919189453125, -0.04422187805175781, -0.040584564208984375, -0.03694725036621094, -0.0333099365234375, -0.029672622680664062, -0.026035308837890625, -0.022397994995117188, -0.01876068115234375, -0.015123367309570312, -0.011486053466796875, -0.007848739624023438, -0.00421142578125, -0.0005741119384765625, 0.003063201904296875, 0.0067005157470703125, 0.01033782958984375, 0.013975143432617188, 0.017612457275390625, 0.021249771118164062, 0.0248870849609375, 0.028524398803710938, 0.032161712646484375, 0.03579902648925781, 0.03943634033203125, 0.04307365417480469, 0.046710968017578125, 0.05034828186035156, 0.053985595703125, 0.05762290954589844, 0.061260223388671875, 0.06489753723144531, 0.06853485107421875, 0.07217216491699219, 0.07580947875976562, 0.07944679260253906, 0.0830841064453125, 0.08672142028808594, 0.09035873413085938, 0.09399604797363281, 0.09763336181640625, 0.10127067565917969, 0.10490798950195312, 0.10854530334472656, 0.1121826171875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 7.0, 10.0, 14.0, 11.0, 5.0, 21.0, 18.0, 17.0, 27.0, 24.0, 15.0, 37.0, 38.0, 26.0, 31.0, 41.0, 42.0, 36.0, 42.0, 33.0, 48.0, 38.0, 43.0, 44.0, 40.0, 30.0, 35.0, 28.0, 32.0, 25.0, 18.0, 20.0, 16.0, 17.0, 12.0, 5.0, 8.0, 5.0, 10.0, 12.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.033660888671875, -0.03256034851074219, -0.031459808349609375, -0.030359268188476562, -0.02925872802734375, -0.028158187866210938, -0.027057647705078125, -0.025957107543945312, -0.0248565673828125, -0.023756027221679688, -0.022655487060546875, -0.021554946899414062, -0.02045440673828125, -0.019353866577148438, -0.018253326416015625, -0.017152786254882812, -0.01605224609375, -0.014951705932617188, -0.013851165771484375, -0.012750625610351562, -0.01165008544921875, -0.010549545288085938, -0.009449005126953125, -0.008348464965820312, -0.0072479248046875, -0.0061473846435546875, -0.005046844482421875, -0.0039463043212890625, -0.00284576416015625, -0.0017452239990234375, -0.000644683837890625, 0.0004558563232421875, 0.001556396484375, 0.0026569366455078125, 0.003757476806640625, 0.0048580169677734375, 0.00595855712890625, 0.0070590972900390625, 0.008159637451171875, 0.009260177612304688, 0.0103607177734375, 0.011461257934570312, 0.012561798095703125, 0.013662338256835938, 0.01476287841796875, 0.015863418579101562, 0.016963958740234375, 0.018064498901367188, 0.0191650390625, 0.020265579223632812, 0.021366119384765625, 0.022466659545898438, 0.02356719970703125, 0.024667739868164062, 0.025768280029296875, 0.026868820190429688, 0.0279693603515625, 0.029069900512695312, 0.030170440673828125, 0.03127098083496094, 0.03237152099609375, 0.03347206115722656, 0.034572601318359375, 0.03567314147949219, 0.036773681640625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 4.0, 10.0, 10.0, 19.0, 19.0, 20.0, 38.0, 42.0, 70.0, 127.0, 167.0, 274.0, 516.0, 847.0, 1532.0, 2592.0, 4648.0, 9101.0, 19439.0, 48697.0, 705273.0, 184919.0, 37265.0, 15769.0, 7625.0, 4050.0, 2252.0, 1276.0, 750.0, 452.0, 258.0, 165.0, 109.0, 48.0, 44.0, 29.0, 30.0, 17.0, 10.0, 7.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.017669677734375, -0.01714801788330078, -0.016626358032226562, -0.016104698181152344, -0.015583038330078125, -0.015061378479003906, -0.014539718627929688, -0.014018058776855469, -0.01349639892578125, -0.012974739074707031, -0.012453079223632812, -0.011931419372558594, -0.011409759521484375, -0.010888099670410156, -0.010366439819335938, -0.009844779968261719, -0.0093231201171875, -0.008801460266113281, -0.008279800415039062, -0.007758140563964844, -0.007236480712890625, -0.006714820861816406, -0.0061931610107421875, -0.005671501159667969, -0.00514984130859375, -0.004628181457519531, -0.0041065216064453125, -0.0035848617553710938, -0.003063201904296875, -0.0025415420532226562, -0.0020198822021484375, -0.0014982223510742188, -0.0009765625, -0.00045490264892578125, 6.67572021484375e-05, 0.0005884170532226562, 0.001110076904296875, 0.0016317367553710938, 0.0021533966064453125, 0.0026750564575195312, 0.00319671630859375, 0.0037183761596679688, 0.0042400360107421875, 0.004761695861816406, 0.005283355712890625, 0.005805015563964844, 0.0063266754150390625, 0.006848335266113281, 0.0073699951171875, 0.007891654968261719, 0.008413314819335938, 0.008934974670410156, 0.009456634521484375, 0.009978294372558594, 0.010499954223632812, 0.011021614074707031, 0.01154327392578125, 0.012064933776855469, 0.012586593627929688, 0.013108253479003906, 0.013629913330078125, 0.014151573181152344, 0.014673233032226562, 0.015194892883300781, 0.015716552734375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 7.0, 0.0, 7.0, 20.0, 18.0, 0.0, 15.0, 28.0, 51.0, 0.0, 75.0, 90.0, 132.0, 0.0, 134.0, 98.0, 95.0, 0.0, 68.0, 48.0, 34.0, 0.0, 19.0, 24.0, 8.0, 0.0, 6.0, 7.0, 6.0, 0.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06, 1.475214958190918e-06, 1.519918441772461e-06, 1.564621925354004e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 5.0, 17.0, 8.0, 21.0, 40.0, 31.0, 56.0, 85.0, 127.0, 158.0, 191.0, 324.0, 429.0, 565.0, 858.0, 1296.0, 1902.0, 2936.0, 4833.0, 8376.0, 15401.0, 33773.0, 127872.0, 741985.0, 56657.0, 22228.0, 10955.0, 6270.0, 3760.0, 2244.0, 1505.0, 1080.0, 698.0, 542.0, 338.0, 252.0, 212.0, 136.0, 98.0, 79.0, 59.0, 52.0, 29.0, 19.0, 11.0, 18.0, 6.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.01727294921875, -0.016753435134887695, -0.01623392105102539, -0.015714406967163086, -0.015194892883300781, -0.014675378799438477, -0.014155864715576172, -0.013636350631713867, -0.013116836547851562, -0.012597322463989258, -0.012077808380126953, -0.011558294296264648, -0.011038780212402344, -0.010519266128540039, -0.009999752044677734, -0.00948023796081543, -0.008960723876953125, -0.00844120979309082, -0.007921695709228516, -0.007402181625366211, -0.006882667541503906, -0.0063631534576416016, -0.005843639373779297, -0.005324125289916992, -0.0048046112060546875, -0.004285097122192383, -0.003765583038330078, -0.0032460689544677734, -0.0027265548706054688, -0.002207040786743164, -0.0016875267028808594, -0.0011680126190185547, -0.00064849853515625, -0.0001289844512939453, 0.0003905296325683594, 0.0009100437164306641, 0.0014295578002929688, 0.0019490718841552734, 0.002468585968017578, 0.002988100051879883, 0.0035076141357421875, 0.004027128219604492, 0.004546642303466797, 0.0050661563873291016, 0.005585670471191406, 0.006105184555053711, 0.006624698638916016, 0.00714421272277832, 0.007663726806640625, 0.00818324089050293, 0.008702754974365234, 0.009222269058227539, 0.009741783142089844, 0.010261297225952148, 0.010780811309814453, 0.011300325393676758, 0.011819839477539062, 0.012339353561401367, 0.012858867645263672, 0.013378381729125977, 0.013897895812988281, 0.014417409896850586, 0.01493692398071289, 0.015456438064575195, 0.0159759521484375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 12.0, 9.0, 9.0, 16.0, 26.0, 29.0, 46.0, 80.0, 426.0, 116.0, 56.0, 30.0, 18.0, 17.0, 13.0, 17.0, 9.0, 13.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.005374908447265625, -0.005228400230407715, -0.005081892013549805, -0.0049353837966918945, -0.004788875579833984, -0.004642367362976074, -0.004495859146118164, -0.004349350929260254, -0.004202842712402344, -0.004056334495544434, -0.0039098262786865234, -0.0037633180618286133, -0.003616809844970703, -0.003470301628112793, -0.003323793411254883, -0.0031772851943969727, -0.0030307769775390625, -0.0028842687606811523, -0.002737760543823242, -0.002591252326965332, -0.002444744110107422, -0.0022982358932495117, -0.0021517276763916016, -0.0020052194595336914, -0.0018587112426757812, -0.001712203025817871, -0.001565694808959961, -0.0014191865921020508, -0.0012726783752441406, -0.0011261701583862305, -0.0009796619415283203, -0.0008331537246704102, -0.0006866455078125, -0.0005401372909545898, -0.0003936290740966797, -0.00024712085723876953, -0.00010061264038085938, 4.589557647705078e-05, 0.00019240379333496094, 0.0003389120101928711, 0.00048542022705078125, 0.0006319284439086914, 0.0007784366607666016, 0.0009249448776245117, 0.0010714530944824219, 0.001217961311340332, 0.0013644695281982422, 0.0015109777450561523, 0.0016574859619140625, 0.0018039941787719727, 0.0019505023956298828, 0.002097010612487793, 0.002243518829345703, 0.0023900270462036133, 0.0025365352630615234, 0.0026830434799194336, 0.0028295516967773438, 0.002976059913635254, 0.003122568130493164, 0.0032690763473510742, 0.0034155845642089844, 0.0035620927810668945, 0.0037086009979248047, 0.003855109214782715, 0.004001617431640625]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 1.0, 6.0, 7.0, 10.0, 16.0, 15.0, 20.0, 23.0, 31.0, 45.0, 56.0, 69.0, 110.0, 129.0, 118.0, 68.0, 68.0, 49.0, 39.0, 21.0, 19.0, 18.0, 14.0, 11.0, 10.0, 6.0, 8.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08501093089580536, -0.08204293251037598, -0.0790749341249466, -0.07610693573951721, -0.07313893735408783, -0.07017094641923904, -0.06720294803380966, -0.06423494964838028, -0.0612669512629509, -0.058298952877521515, -0.05533095449209213, -0.05236295983195305, -0.049394961446523666, -0.046426963061094284, -0.0434589684009552, -0.04049097001552582, -0.037522971630096436, -0.03455497324466705, -0.03158697485923767, -0.028618980199098587, -0.025650981813669205, -0.022682983428239822, -0.01971498690545559, -0.016746990382671356, -0.013778991997241974, -0.010810994543135166, -0.007842997089028358, -0.004874999634921551, -0.001907002180814743, 0.0010609952732920647, 0.004028992727398872, 0.0069969892501831055, 0.009964995086193085, 0.012932992540299892, 0.0159009899944067, 0.018868986517190933, 0.021836984902620316, 0.024804983288049698, 0.02777297981083393, 0.030740976333618164, 0.033708974719047546, 0.03667697310447693, 0.03964497148990631, 0.042612966150045395, 0.04558096453547478, 0.04854896292090416, 0.05151695758104324, 0.054484955966472626, 0.05745295435190201, 0.06042095273733139, 0.06338895112276077, 0.06635694950819016, 0.06932494044303894, 0.07229293882846832, 0.0752609372138977, 0.07822893559932709, 0.08119693398475647, 0.08416493237018585, 0.08713293075561523, 0.09010092914104462, 0.093068927526474, 0.09603691846132278, 0.09900491684675217, 0.10197291523218155, 0.10494091361761093]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 4.0, 9.0, 8.0, 14.0, 18.0, 21.0, 16.0, 35.0, 36.0, 36.0, 33.0, 42.0, 45.0, 30.0, 39.0, 36.0, 42.0, 62.0, 52.0, 43.0, 46.0, 39.0, 40.0, 36.0, 31.0, 30.0, 32.0, 27.0, 24.0, 15.0, 12.0, 13.0, 4.0, 4.0, 6.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06216754391789436, -0.06002369895577431, -0.05787985026836395, -0.055736005306243896, -0.05359215661883354, -0.051448311656713486, -0.04930446296930313, -0.047160618007183075, -0.04501677304506302, -0.04287292808294296, -0.04072907939553261, -0.03858523443341255, -0.0364413857460022, -0.03429754078388214, -0.032153695821762085, -0.03000984713435173, -0.027865998446941376, -0.02572215162217617, -0.023578304797410965, -0.02143445983529091, -0.019290611147880554, -0.017146766185760498, -0.015002919360995293, -0.012859072536230087, -0.010715225711464882, -0.008571378886699677, -0.0064275325275957584, -0.00428368616849184, -0.002139839343726635, 4.007481038570404e-06, 0.002147853374481201, 0.0042917001992464066, 0.00643555074930191, 0.008579397574067116, 0.010723244398832321, 0.012867090292274952, 0.015010937117040157, 0.017154783010482788, 0.019298629835247993, 0.0214424766600132, 0.023586323484778404, 0.02573017030954361, 0.027874017134308815, 0.03001786395907402, 0.03216170892119408, 0.03430555760860443, 0.03644940257072449, 0.03859324753284454, 0.0407370962202549, 0.042880941182374954, 0.04502478986978531, 0.047168634831905365, 0.04931248351931572, 0.051456328481435776, 0.05360017716884613, 0.055744022130966187, 0.05788786709308624, 0.0600317120552063, 0.06217556074261665, 0.06431940943002701, 0.06646325439214706, 0.06860709935426712, 0.07075094431638718, 0.07289479672908783, 0.07503864169120789]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 14.0, 15.0, 22.0, 42.0, 67.0, 93.0, 140.0, 227.0, 306.0, 488.0, 713.0, 1196.0, 1970.0, 3239.0, 5575.0, 9800.0, 18392.0, 36332.0, 79313.0, 199280.0, 850264.0, 2286208.0, 439220.0, 135742.0, 59674.0, 29647.0, 15236.0, 8588.0, 4776.0, 2838.0, 1815.0, 1035.0, 670.0, 434.0, 304.0, 182.0, 115.0, 98.0, 63.0, 48.0, 29.0, 17.0, 13.0, 9.0, 6.0, 13.0, 4.0, 9.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.08711624145507812, -0.08353424072265625, -0.07995223999023438, -0.0763702392578125, -0.07278823852539062, -0.06920623779296875, -0.06562423706054688, -0.062042236328125, -0.058460235595703125, -0.05487823486328125, -0.051296234130859375, -0.0477142333984375, -0.044132232666015625, -0.04055023193359375, -0.036968231201171875, -0.03338623046875, -0.029804229736328125, -0.02622222900390625, -0.022640228271484375, -0.0190582275390625, -0.015476226806640625, -0.01189422607421875, -0.008312225341796875, -0.004730224609375, -0.001148223876953125, 0.00243377685546875, 0.006015777587890625, 0.0095977783203125, 0.013179779052734375, 0.01676177978515625, 0.020343780517578125, 0.02392578125, 0.027507781982421875, 0.03108978271484375, 0.034671783447265625, 0.0382537841796875, 0.041835784912109375, 0.04541778564453125, 0.048999786376953125, 0.052581787109375, 0.056163787841796875, 0.05974578857421875, 0.06332778930664062, 0.0669097900390625, 0.07049179077148438, 0.07407379150390625, 0.07765579223632812, 0.08123779296875, 0.08481979370117188, 0.08840179443359375, 0.09198379516601562, 0.0955657958984375, 0.09914779663085938, 0.10272979736328125, 0.10631179809570312, 0.109893798828125, 0.11347579956054688, 0.11705780029296875, 0.12063980102539062, 0.1242218017578125, 0.12780380249023438, 0.13138580322265625, 0.13496780395507812, 0.1385498046875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 6.0, 3.0, 9.0, 9.0, 12.0, 22.0, 19.0, 25.0, 37.0, 24.0, 34.0, 37.0, 42.0, 48.0, 51.0, 39.0, 43.0, 45.0, 59.0, 47.0, 44.0, 47.0, 45.0, 37.0, 29.0, 26.0, 28.0, 32.0, 20.0, 18.0, 17.0, 11.0, 6.0, 3.0, 6.0, 7.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.039703369140625, -0.038402557373046875, -0.03710174560546875, -0.035800933837890625, -0.0345001220703125, -0.033199310302734375, -0.03189849853515625, -0.030597686767578125, -0.029296875, -0.027996063232421875, -0.02669525146484375, -0.025394439697265625, -0.0240936279296875, -0.022792816162109375, -0.02149200439453125, -0.020191192626953125, -0.018890380859375, -0.017589569091796875, -0.01628875732421875, -0.014987945556640625, -0.0136871337890625, -0.012386322021484375, -0.01108551025390625, -0.009784698486328125, -0.00848388671875, -0.007183074951171875, -0.00588226318359375, -0.004581451416015625, -0.0032806396484375, -0.001979827880859375, -0.00067901611328125, 0.000621795654296875, 0.001922607421875, 0.003223419189453125, 0.00452423095703125, 0.005825042724609375, 0.0071258544921875, 0.008426666259765625, 0.00972747802734375, 0.011028289794921875, 0.0123291015625, 0.013629913330078125, 0.01493072509765625, 0.016231536865234375, 0.0175323486328125, 0.018833160400390625, 0.02013397216796875, 0.021434783935546875, 0.022735595703125, 0.024036407470703125, 0.02533721923828125, 0.026638031005859375, 0.0279388427734375, 0.029239654541015625, 0.03054046630859375, 0.031841278076171875, 0.03314208984375, 0.034442901611328125, 0.03574371337890625, 0.037044525146484375, 0.0383453369140625, 0.039646148681640625, 0.04094696044921875, 0.042247772216796875, 0.043548583984375]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 9.0, 18.0, 21.0, 31.0, 52.0, 56.0, 89.0, 141.0, 205.0, 326.0, 388.0, 717.0, 1066.0, 1629.0, 2669.0, 4285.0, 7117.0, 12302.0, 21600.0, 39530.0, 74789.0, 152004.0, 358923.0, 1119708.0, 1555006.0, 459599.0, 185975.0, 89594.0, 45833.0, 25206.0, 13962.0, 8251.0, 4868.0, 2973.0, 1891.0, 1176.0, 757.0, 512.0, 334.0, 212.0, 128.0, 101.0, 69.0, 54.0, 29.0, 20.0, 19.0, 15.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.07171630859375, -0.0694122314453125, -0.067108154296875, -0.0648040771484375, -0.0625, -0.0601959228515625, -0.057891845703125, -0.0555877685546875, -0.05328369140625, -0.0509796142578125, -0.048675537109375, -0.0463714599609375, -0.0440673828125, -0.0417633056640625, -0.039459228515625, -0.0371551513671875, -0.03485107421875, -0.0325469970703125, -0.030242919921875, -0.0279388427734375, -0.025634765625, -0.0233306884765625, -0.021026611328125, -0.0187225341796875, -0.01641845703125, -0.0141143798828125, -0.011810302734375, -0.0095062255859375, -0.0072021484375, -0.0048980712890625, -0.002593994140625, -0.0002899169921875, 0.00201416015625, 0.0043182373046875, 0.006622314453125, 0.0089263916015625, 0.01123046875, 0.0135345458984375, 0.015838623046875, 0.0181427001953125, 0.02044677734375, 0.0227508544921875, 0.025054931640625, 0.0273590087890625, 0.0296630859375, 0.0319671630859375, 0.034271240234375, 0.0365753173828125, 0.03887939453125, 0.0411834716796875, 0.043487548828125, 0.0457916259765625, 0.048095703125, 0.0503997802734375, 0.052703857421875, 0.0550079345703125, 0.05731201171875, 0.0596160888671875, 0.061920166015625, 0.0642242431640625, 0.0665283203125, 0.0688323974609375, 0.071136474609375, 0.0734405517578125, 0.07574462890625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 5.0, 7.0, 10.0, 11.0, 10.0, 29.0, 26.0, 35.0, 33.0, 57.0, 52.0, 76.0, 82.0, 95.0, 118.0, 143.0, 192.0, 225.0, 280.0, 318.0, 319.0, 319.0, 301.0, 223.0, 231.0, 190.0, 122.0, 98.0, 92.0, 85.0, 59.0, 40.0, 35.0, 35.0, 19.0, 25.0, 17.0, 11.0, 13.0, 8.0, 4.0, 5.0, 8.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0222930908203125, -0.021649599075317383, -0.021006107330322266, -0.02036261558532715, -0.01971912384033203, -0.019075632095336914, -0.018432140350341797, -0.01778864860534668, -0.017145156860351562, -0.016501665115356445, -0.015858173370361328, -0.015214681625366211, -0.014571189880371094, -0.013927698135375977, -0.01328420639038086, -0.012640714645385742, -0.011997222900390625, -0.011353731155395508, -0.01071023941040039, -0.010066747665405273, -0.009423255920410156, -0.008779764175415039, -0.008136272430419922, -0.007492780685424805, -0.0068492889404296875, -0.00620579719543457, -0.005562305450439453, -0.004918813705444336, -0.004275321960449219, -0.0036318302154541016, -0.0029883384704589844, -0.002344846725463867, -0.00170135498046875, -0.0010578632354736328, -0.0004143714904785156, 0.00022912025451660156, 0.0008726119995117188, 0.001516103744506836, 0.002159595489501953, 0.0028030872344970703, 0.0034465789794921875, 0.004090070724487305, 0.004733562469482422, 0.005377054214477539, 0.006020545959472656, 0.0066640377044677734, 0.007307529449462891, 0.007951021194458008, 0.008594512939453125, 0.009238004684448242, 0.00988149642944336, 0.010524988174438477, 0.011168479919433594, 0.011811971664428711, 0.012455463409423828, 0.013098955154418945, 0.013742446899414062, 0.01438593864440918, 0.015029430389404297, 0.015672922134399414, 0.01631641387939453, 0.01695990562438965, 0.017603397369384766, 0.018246889114379883, 0.018890380859375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 7.0, 3.0, 7.0, 8.0, 13.0, 17.0, 19.0, 24.0, 34.0, 61.0, 85.0, 77.0, 109.0, 137.0, 92.0, 56.0, 59.0, 41.0, 42.0, 23.0, 22.0, 15.0, 16.0, 4.0, 3.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05782319977879524, -0.05584748834371567, -0.05387178063392639, -0.05189606919884682, -0.04992035776376724, -0.047944650053977966, -0.04596893861889839, -0.04399322718381882, -0.04201751947402954, -0.040041808038949966, -0.03806610032916069, -0.036090388894081116, -0.03411467745900154, -0.03213896602392197, -0.03016325831413269, -0.028187546879053116, -0.02621183544397354, -0.024236125871539116, -0.02226041443645954, -0.020284704864025116, -0.01830899342894554, -0.016333283856511116, -0.01435757428407669, -0.01238186378031969, -0.01040615327656269, -0.00843044277280569, -0.006454732734709978, -0.0044790226966142654, -0.0025033121928572655, -0.0005276016891002655, 0.0014481078833341599, 0.00342381838709116, 0.005399532616138458, 0.007375243119895458, 0.009350953623652458, 0.011326663196086884, 0.013302373699843884, 0.015278084203600883, 0.01725379377603531, 0.019229505211114883, 0.02120521478354931, 0.023180924355983734, 0.02515663579106331, 0.027132345363497734, 0.02910805493593216, 0.031083766371011734, 0.03305947780609131, 0.035035185515880585, 0.03701089695096016, 0.038986608386039734, 0.04096231609582901, 0.042938027530908585, 0.04491373896598816, 0.046889446675777435, 0.04886515811085701, 0.050840869545936584, 0.05281657725572586, 0.054792288690805435, 0.05676799640059471, 0.058743707835674286, 0.06071941927075386, 0.06269513070583344, 0.06467083841562271, 0.06664654612541199, 0.06862226128578186]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 7.0, 12.0, 12.0, 13.0, 11.0, 17.0, 30.0, 26.0, 32.0, 32.0, 39.0, 36.0, 40.0, 39.0, 52.0, 36.0, 46.0, 47.0, 44.0, 41.0, 38.0, 39.0, 39.0, 42.0, 34.0, 32.0, 23.0, 25.0, 14.0, 21.0, 18.0, 10.0, 12.0, 10.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03892144933342934, -0.03759174793958664, -0.03626204654574394, -0.034932345151901245, -0.03360264375805855, -0.03227294236421585, -0.030943239107728004, -0.029613537713885307, -0.02828383632004261, -0.026954134926199913, -0.025624433532357216, -0.02429473027586937, -0.022965028882026672, -0.021635327488183975, -0.020305626094341278, -0.01897592470049858, -0.017646223306655884, -0.016316521912813187, -0.01498682051897049, -0.013657118193805218, -0.01232741679996252, -0.010997715406119823, -0.009668013080954552, -0.008338311687111855, -0.007008610293269157, -0.00567890889942646, -0.004349207039922476, -0.0030195051804184914, -0.0016898037865757942, -0.0003601023927330971, 0.0009695999324321747, 0.002299301326274872, 0.003629002720117569, 0.004958704113960266, 0.0062884059734642506, 0.007618107832968235, 0.008947809226810932, 0.01027751062065363, 0.011607212945818901, 0.012936914339661598, 0.014266615733504295, 0.015596317127346992, 0.01692601852118969, 0.018255721777677536, 0.019585423171520233, 0.02091512456536293, 0.022244825959205627, 0.023574527353048325, 0.02490422874689102, 0.02623393014073372, 0.027563631534576416, 0.028893332928419113, 0.03022303432226181, 0.03155273571610451, 0.032882437109947205, 0.0342121422290802, 0.0355418398976326, 0.036871541291475296, 0.03820124268531799, 0.03953094407916069, 0.04086064547300339, 0.042190346866846085, 0.04352004826068878, 0.04484975337982178, 0.046179454773664474]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 8.0, 13.0, 17.0, 31.0, 29.0, 46.0, 89.0, 102.0, 148.0, 237.0, 388.0, 626.0, 1033.0, 1837.0, 3253.0, 6072.0, 11793.0, 23322.0, 49744.0, 124828.0, 400746.0, 261912.0, 86604.0, 37256.0, 17939.0, 9110.0, 4870.0, 2641.0, 1472.0, 876.0, 509.0, 341.0, 200.0, 145.0, 94.0, 58.0, 36.0, 32.0, 34.0, 14.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.0193328857421875, -0.01874375343322754, -0.018154621124267578, -0.017565488815307617, -0.016976356506347656, -0.016387224197387695, -0.015798091888427734, -0.015208959579467773, -0.014619827270507812, -0.014030694961547852, -0.01344156265258789, -0.01285243034362793, -0.012263298034667969, -0.011674165725708008, -0.011085033416748047, -0.010495901107788086, -0.009906768798828125, -0.009317636489868164, -0.008728504180908203, -0.008139371871948242, -0.007550239562988281, -0.00696110725402832, -0.006371974945068359, -0.0057828426361083984, -0.0051937103271484375, -0.0046045780181884766, -0.004015445709228516, -0.0034263134002685547, -0.0028371810913085938, -0.002248048782348633, -0.0016589164733886719, -0.001069784164428711, -0.00048065185546875, 0.00010848045349121094, 0.0006976127624511719, 0.0012867450714111328, 0.0018758773803710938, 0.0024650096893310547, 0.0030541419982910156, 0.0036432743072509766, 0.0042324066162109375, 0.0048215389251708984, 0.005410671234130859, 0.00599980354309082, 0.006588935852050781, 0.007178068161010742, 0.007767200469970703, 0.008356332778930664, 0.008945465087890625, 0.009534597396850586, 0.010123729705810547, 0.010712862014770508, 0.011301994323730469, 0.01189112663269043, 0.01248025894165039, 0.013069391250610352, 0.013658523559570312, 0.014247655868530273, 0.014836788177490234, 0.015425920486450195, 0.016015052795410156, 0.016604185104370117, 0.017193317413330078, 0.01778244972229004, 0.01837158203125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 2.0, 10.0, 6.0, 6.0, 8.0, 24.0, 13.0, 16.0, 25.0, 14.0, 27.0, 41.0, 26.0, 41.0, 30.0, 52.0, 50.0, 41.0, 52.0, 44.0, 41.0, 46.0, 39.0, 45.0, 37.0, 42.0, 39.0, 21.0, 27.0, 20.0, 21.0, 14.0, 17.0, 13.0, 13.0, 10.0, 9.0, 8.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0408935546875, -0.039545536041259766, -0.03819751739501953, -0.0368494987487793, -0.03550148010253906, -0.03415346145629883, -0.032805442810058594, -0.03145742416381836, -0.030109405517578125, -0.02876138687133789, -0.027413368225097656, -0.026065349578857422, -0.024717330932617188, -0.023369312286376953, -0.02202129364013672, -0.020673274993896484, -0.01932525634765625, -0.017977237701416016, -0.01662921905517578, -0.015281200408935547, -0.013933181762695312, -0.012585163116455078, -0.011237144470214844, -0.00988912582397461, -0.008541107177734375, -0.007193088531494141, -0.005845069885253906, -0.004497051239013672, -0.0031490325927734375, -0.0018010139465332031, -0.00045299530029296875, 0.0008950233459472656, 0.0022430419921875, 0.0035910606384277344, 0.004939079284667969, 0.006287097930908203, 0.0076351165771484375, 0.008983135223388672, 0.010331153869628906, 0.01167917251586914, 0.013027191162109375, 0.01437520980834961, 0.015723228454589844, 0.017071247100830078, 0.018419265747070312, 0.019767284393310547, 0.02111530303955078, 0.022463321685791016, 0.02381134033203125, 0.025159358978271484, 0.02650737762451172, 0.027855396270751953, 0.029203414916992188, 0.030551433563232422, 0.031899452209472656, 0.03324747085571289, 0.034595489501953125, 0.03594350814819336, 0.037291526794433594, 0.03863954544067383, 0.03998756408691406, 0.0413355827331543, 0.04268360137939453, 0.044031620025634766, 0.045379638671875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 10.0, 18.0, 25.0, 32.0, 37.0, 82.0, 102.0, 150.0, 202.0, 304.0, 406.0, 633.0, 956.0, 1492.0, 2327.0, 3837.0, 6410.0, 11180.0, 20518.0, 41465.0, 99456.0, 391149.0, 299545.0, 86187.0, 37116.0, 19028.0, 10294.0, 5819.0, 3476.0, 2151.0, 1323.0, 922.0, 609.0, 372.0, 249.0, 183.0, 145.0, 90.0, 51.0, 52.0, 34.0, 26.0, 26.0, 16.0, 11.0, 9.0, 5.0, 8.0, 2.0, 3.0, 6.0], "bins": [-0.02276611328125, -0.022114276885986328, -0.021462440490722656, -0.020810604095458984, -0.020158767700195312, -0.01950693130493164, -0.01885509490966797, -0.018203258514404297, -0.017551422119140625, -0.016899585723876953, -0.01624774932861328, -0.01559591293334961, -0.014944076538085938, -0.014292240142822266, -0.013640403747558594, -0.012988567352294922, -0.01233673095703125, -0.011684894561767578, -0.011033058166503906, -0.010381221771240234, -0.009729385375976562, -0.00907754898071289, -0.008425712585449219, -0.007773876190185547, -0.007122039794921875, -0.006470203399658203, -0.005818367004394531, -0.005166530609130859, -0.0045146942138671875, -0.0038628578186035156, -0.0032110214233398438, -0.002559185028076172, -0.0019073486328125, -0.0012555122375488281, -0.0006036758422851562, 4.8160552978515625e-05, 0.0006999969482421875, 0.0013518333435058594, 0.0020036697387695312, 0.002655506134033203, 0.003307342529296875, 0.003959178924560547, 0.004611015319824219, 0.005262851715087891, 0.0059146881103515625, 0.006566524505615234, 0.007218360900878906, 0.007870197296142578, 0.00852203369140625, 0.009173870086669922, 0.009825706481933594, 0.010477542877197266, 0.011129379272460938, 0.01178121566772461, 0.012433052062988281, 0.013084888458251953, 0.013736724853515625, 0.014388561248779297, 0.015040397644042969, 0.01569223403930664, 0.016344070434570312, 0.016995906829833984, 0.017647743225097656, 0.018299579620361328, 0.018951416015625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 4.0, 7.0, 8.0, 13.0, 4.0, 15.0, 15.0, 15.0, 15.0, 25.0, 36.0, 31.0, 30.0, 26.0, 31.0, 27.0, 37.0, 35.0, 33.0, 40.0, 40.0, 42.0, 43.0, 39.0, 47.0, 24.0, 39.0, 36.0, 29.0, 27.0, 26.0, 27.0, 15.0, 16.0, 13.0, 5.0, 19.0, 19.0, 10.0, 5.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0239410400390625, -0.023177146911621094, -0.022413253784179688, -0.02164936065673828, -0.020885467529296875, -0.02012157440185547, -0.019357681274414062, -0.018593788146972656, -0.01782989501953125, -0.017066001892089844, -0.016302108764648438, -0.015538215637207031, -0.014774322509765625, -0.014010429382324219, -0.013246536254882812, -0.012482643127441406, -0.01171875, -0.010954856872558594, -0.010190963745117188, -0.009427070617675781, -0.008663177490234375, -0.007899284362792969, -0.0071353912353515625, -0.006371498107910156, -0.00560760498046875, -0.004843711853027344, -0.0040798187255859375, -0.0033159255981445312, -0.002552032470703125, -0.0017881393432617188, -0.0010242462158203125, -0.00026035308837890625, 0.0005035400390625, 0.0012674331665039062, 0.0020313262939453125, 0.0027952194213867188, 0.003559112548828125, 0.004323005676269531, 0.0050868988037109375, 0.005850791931152344, 0.00661468505859375, 0.007378578186035156, 0.008142471313476562, 0.008906364440917969, 0.009670257568359375, 0.010434150695800781, 0.011198043823242188, 0.011961936950683594, 0.012725830078125, 0.013489723205566406, 0.014253616333007812, 0.015017509460449219, 0.015781402587890625, 0.01654529571533203, 0.017309188842773438, 0.018073081970214844, 0.01883697509765625, 0.019600868225097656, 0.020364761352539062, 0.02112865447998047, 0.021892547607421875, 0.02265644073486328, 0.023420333862304688, 0.024184226989746094, 0.0249481201171875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 8.0, 6.0, 5.0, 9.0, 12.0, 30.0, 28.0, 34.0, 44.0, 77.0, 94.0, 133.0, 171.0, 285.0, 363.0, 549.0, 766.0, 1203.0, 1831.0, 2772.0, 4547.0, 7764.0, 14019.0, 27761.0, 69361.0, 497039.0, 301535.0, 60391.0, 25310.0, 12830.0, 7155.0, 4379.0, 2714.0, 1701.0, 1149.0, 761.0, 508.0, 347.0, 242.0, 177.0, 123.0, 96.0, 66.0, 51.0, 31.0, 19.0, 15.0, 15.0, 10.0, 10.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.0016813278198242188, -0.001625165343284607, -0.0015690028667449951, -0.0015128403902053833, -0.0014566779136657715, -0.0014005154371261597, -0.0013443529605865479, -0.001288190484046936, -0.0012320280075073242, -0.0011758655309677124, -0.0011197030544281006, -0.0010635405778884888, -0.001007378101348877, -0.0009512156248092651, -0.0008950531482696533, -0.0008388906717300415, -0.0007827281951904297, -0.0007265657186508179, -0.0006704032421112061, -0.0006142407655715942, -0.0005580782890319824, -0.0005019158124923706, -0.0004457533359527588, -0.00038959085941314697, -0.00033342838287353516, -0.00027726590633392334, -0.00022110342979431152, -0.0001649409532546997, -0.00010877847671508789, -5.2616000175476074e-05, 3.546476364135742e-06, 5.970895290374756e-05, 0.00011587142944335938, 0.0001720339059829712, 0.000228196382522583, 0.0002843588590621948, 0.00034052133560180664, 0.00039668381214141846, 0.0004528462886810303, 0.0005090087652206421, 0.0005651712417602539, 0.0006213337182998657, 0.0006774961948394775, 0.0007336586713790894, 0.0007898211479187012, 0.000845983624458313, 0.0009021461009979248, 0.0009583085775375366, 0.0010144710540771484, 0.0010706335306167603, 0.001126796007156372, 0.0011829584836959839, 0.0012391209602355957, 0.0012952834367752075, 0.0013514459133148193, 0.0014076083898544312, 0.001463770866394043, 0.0015199333429336548, 0.0015760958194732666, 0.0016322582960128784, 0.0016884207725524902, 0.001744583249092102, 0.0018007457256317139, 0.0018569082021713257, 0.0019130706787109375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 0.0, 7.0, 0.0, 15.0, 15.0, 0.0, 17.0, 0.0, 20.0, 0.0, 32.0, 0.0, 45.0, 0.0, 45.0, 0.0, 68.0, 0.0, 68.0, 0.0, 87.0, 118.0, 0.0, 95.0, 0.0, 90.0, 0.0, 60.0, 0.0, 67.0, 0.0, 41.0, 0.0, 39.0, 0.0, 22.0, 15.0, 0.0, 17.0, 0.0, 4.0, 0.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0], "bins": [-1.0728836059570312e-06, -1.041218638420105e-06, -1.0095536708831787e-06, -9.778887033462524e-07, -9.462237358093262e-07, -9.145587682723999e-07, -8.828938007354736e-07, -8.512288331985474e-07, -8.195638656616211e-07, -7.878988981246948e-07, -7.562339305877686e-07, -7.245689630508423e-07, -6.92903995513916e-07, -6.612390279769897e-07, -6.295740604400635e-07, -5.979090929031372e-07, -5.662441253662109e-07, -5.345791578292847e-07, -5.029141902923584e-07, -4.7124922275543213e-07, -4.3958425521850586e-07, -4.079192876815796e-07, -3.762543201446533e-07, -3.4458935260772705e-07, -3.129243850708008e-07, -2.812594175338745e-07, -2.4959444999694824e-07, -2.1792948246002197e-07, -1.862645149230957e-07, -1.5459954738616943e-07, -1.2293457984924316e-07, -9.12696123123169e-08, -5.960464477539063e-08, -2.7939677238464355e-08, 3.725290298461914e-09, 3.5390257835388184e-08, 6.705522537231445e-08, 9.872019290924072e-08, 1.30385160446167e-07, 1.6205012798309326e-07, 1.9371509552001953e-07, 2.253800630569458e-07, 2.5704503059387207e-07, 2.8870999813079834e-07, 3.203749656677246e-07, 3.520399332046509e-07, 3.8370490074157715e-07, 4.153698682785034e-07, 4.470348358154297e-07, 4.78699803352356e-07, 5.103647708892822e-07, 5.420297384262085e-07, 5.736947059631348e-07, 6.05359673500061e-07, 6.370246410369873e-07, 6.686896085739136e-07, 7.003545761108398e-07, 7.320195436477661e-07, 7.636845111846924e-07, 7.953494787216187e-07, 8.270144462585449e-07, 8.586794137954712e-07, 8.903443813323975e-07, 9.220093488693237e-07, 9.5367431640625e-07]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 5.0, 8.0, 15.0, 30.0, 30.0, 35.0, 51.0, 79.0, 122.0, 173.0, 277.0, 411.0, 584.0, 969.0, 1426.0, 2142.0, 3188.0, 5072.0, 8335.0, 13665.0, 24900.0, 51347.0, 138976.0, 559652.0, 128395.0, 49256.0, 23948.0, 13237.0, 7921.0, 4958.0, 3137.0, 2111.0, 1393.0, 898.0, 608.0, 364.0, 264.0, 180.0, 113.0, 79.0, 59.0, 43.0, 28.0, 24.0, 8.0, 13.0, 8.0, 4.0, 8.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0017271041870117188, -0.0016722232103347778, -0.001617342233657837, -0.001562461256980896, -0.001507580280303955, -0.0014526993036270142, -0.0013978183269500732, -0.0013429373502731323, -0.0012880563735961914, -0.0012331753969192505, -0.0011782944202423096, -0.0011234134435653687, -0.0010685324668884277, -0.0010136514902114868, -0.0009587705135345459, -0.000903889536857605, -0.0008490085601806641, -0.0007941275835037231, -0.0007392466068267822, -0.0006843656301498413, -0.0006294846534729004, -0.0005746036767959595, -0.0005197227001190186, -0.00046484172344207764, -0.0004099607467651367, -0.0003550797700881958, -0.0003001987934112549, -0.00024531781673431396, -0.00019043684005737305, -0.00013555586338043213, -8.067488670349121e-05, -2.5793910026550293e-05, 2.9087066650390625e-05, 8.396804332733154e-05, 0.00013884902000427246, 0.00019372999668121338, 0.0002486109733581543, 0.0003034919500350952, 0.00035837292671203613, 0.00041325390338897705, 0.00046813488006591797, 0.0005230158567428589, 0.0005778968334197998, 0.0006327778100967407, 0.0006876587867736816, 0.0007425397634506226, 0.0007974207401275635, 0.0008523017168045044, 0.0009071826934814453, 0.0009620636701583862, 0.0010169446468353271, 0.001071825623512268, 0.001126706600189209, 0.00118158757686615, 0.0012364685535430908, 0.0012913495302200317, 0.0013462305068969727, 0.0014011114835739136, 0.0014559924602508545, 0.0015108734369277954, 0.0015657544136047363, 0.0016206353902816772, 0.0016755163669586182, 0.001730397343635559, 0.0017852783203125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 9.0, 10.0, 11.0, 4.0, 7.0, 15.0, 12.0, 15.0, 16.0, 31.0, 28.0, 37.0, 54.0, 88.0, 189.0, 113.0, 82.0, 56.0, 36.0, 29.0, 20.0, 21.0, 10.0, 21.0, 9.0, 8.0, 12.0, 0.0, 8.0, 7.0, 8.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004897117614746094, -0.00047268718481063843, -0.0004556626081466675, -0.00043863803148269653, -0.0004216134548187256, -0.00040458887815475464, -0.0003875643014907837, -0.00037053972482681274, -0.0003535151481628418, -0.00033649057149887085, -0.0003194659948348999, -0.00030244141817092896, -0.000285416841506958, -0.00026839226484298706, -0.0002513676881790161, -0.00023434311151504517, -0.00021731853485107422, -0.00020029395818710327, -0.00018326938152313232, -0.00016624480485916138, -0.00014922022819519043, -0.00013219565153121948, -0.00011517107486724854, -9.814649820327759e-05, -8.112192153930664e-05, -6.40973448753357e-05, -4.7072768211364746e-05, -3.00481915473938e-05, -1.3023614883422852e-05, 4.000961780548096e-06, 2.1025538444519043e-05, 3.805011510848999e-05, 5.507469177246094e-05, 7.209926843643188e-05, 8.912384510040283e-05, 0.00010614842176437378, 0.00012317299842834473, 0.00014019757509231567, 0.00015722215175628662, 0.00017424672842025757, 0.00019127130508422852, 0.00020829588174819946, 0.0002253204584121704, 0.00024234503507614136, 0.0002593696117401123, 0.00027639418840408325, 0.0002934187650680542, 0.00031044334173202515, 0.0003274679183959961, 0.00034449249505996704, 0.000361517071723938, 0.00037854164838790894, 0.0003955662250518799, 0.00041259080171585083, 0.0004296153783798218, 0.0004466399550437927, 0.00046366453170776367, 0.0004806891083717346, 0.0004977136850357056, 0.0005147382616996765, 0.0005317628383636475, 0.0005487874150276184, 0.0005658119916915894, 0.0005828365683555603, 0.0005998611450195312]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 2.0, 1.0, 0.0, 6.0, 6.0, 6.0, 8.0, 12.0, 14.0, 22.0, 25.0, 39.0, 53.0, 74.0, 87.0, 110.0, 144.0, 88.0, 52.0, 61.0, 41.0, 41.0, 27.0, 22.0, 14.0, 14.0, 7.0, 3.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05781896039843559, -0.055845148861408234, -0.053871337324380875, -0.051897525787353516, -0.04992371425032616, -0.0479499027132988, -0.04597609117627144, -0.04400227963924408, -0.04202846810221672, -0.04005465656518936, -0.038080845028162, -0.036107033491134644, -0.034133221954107285, -0.032159410417079926, -0.030185598880052567, -0.028211787343025208, -0.02623797580599785, -0.02426416426897049, -0.02229035273194313, -0.02031654119491577, -0.018342729657888412, -0.016368918120861053, -0.014395106583833694, -0.012421295046806335, -0.010447483509778976, -0.008473671972751617, -0.006499860435724258, -0.004526048898696899, -0.0025522373616695404, -0.0005784258246421814, 0.0013953857123851776, 0.0033691972494125366, 0.005343005061149597, 0.007316816598176956, 0.009290628135204315, 0.011264439672231674, 0.013238251209259033, 0.015212062746286392, 0.01718587428331375, 0.01915968582034111, 0.02113349735736847, 0.023107308894395828, 0.025081120431423187, 0.027054931968450546, 0.029028743505477905, 0.031002555042505264, 0.03297636657953262, 0.03495017811655998, 0.03692398965358734, 0.0388978011906147, 0.04087161272764206, 0.04284542426466942, 0.04481923580169678, 0.046793047338724136, 0.048766858875751495, 0.050740670412778854, 0.05271448194980621, 0.05468829348683357, 0.05666210502386093, 0.05863591656088829, 0.06060972809791565, 0.06258353590965271, 0.06455735117197037, 0.06653116643428802, 0.06850497424602509]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 11.0, 12.0, 12.0, 12.0, 17.0, 31.0, 25.0, 32.0, 34.0, 35.0, 35.0, 43.0, 38.0, 53.0, 37.0, 46.0, 46.0, 44.0, 41.0, 40.0, 33.0, 41.0, 44.0, 34.0, 31.0, 25.0, 24.0, 12.0, 24.0, 17.0, 11.0, 12.0, 7.0, 13.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038585368543863297, -0.03726552799344063, -0.03594569116830826, -0.03462585061788559, -0.03330601006746292, -0.03198617324233055, -0.030666332691907883, -0.029346494004130363, -0.028026655316352844, -0.026706816628575325, -0.025386977940797806, -0.024067137390375137, -0.022747298702597618, -0.0214274600148201, -0.02010761946439743, -0.01878778077661991, -0.017467942088842392, -0.016148103401064873, -0.014828263781964779, -0.013508424162864685, -0.012188585475087166, -0.010868746787309647, -0.009548907168209553, -0.008229067549109459, -0.00690922886133194, -0.005589389707893133, -0.004269550554454327, -0.00294971140101552, -0.0016298722475767136, -0.00031003309413790703, 0.0010098060593008995, 0.0023296456784009933, 0.0036494843661785126, 0.004969323519617319, 0.006289162673056126, 0.007609001826494932, 0.008928840979933739, 0.010248679667711258, 0.011568519286811352, 0.012888358905911446, 0.014208197593688965, 0.015528036281466484, 0.016847874969244003, 0.018167715519666672, 0.01948755420744419, 0.02080739289522171, 0.02212723344564438, 0.023447072133421898, 0.024766910821199417, 0.026086749508976936, 0.027406588196754456, 0.028726428747177124, 0.030046267434954643, 0.03136610612273216, 0.03268594667315483, 0.0340057834982872, 0.03532562404870987, 0.03664546459913254, 0.03796530142426491, 0.039285141974687576, 0.040604978799819946, 0.041924819350242615, 0.04324465990066528, 0.04456450045108795, 0.04588433727622032]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 8.0, 7.0, 10.0, 7.0, 14.0, 23.0, 31.0, 41.0, 60.0, 87.0, 162.0, 222.0, 324.0, 433.0, 702.0, 967.0, 1660.0, 2573.0, 3957.0, 6157.0, 9850.0, 15969.0, 27042.0, 45784.0, 81678.0, 165090.0, 311416.0, 171617.0, 84389.0, 46785.0, 27388.0, 16489.0, 9923.0, 6362.0, 3957.0, 2529.0, 1568.0, 1074.0, 778.0, 441.0, 314.0, 236.0, 133.0, 102.0, 66.0, 59.0, 20.0, 16.0, 17.0, 8.0, 5.0, 5.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.078125, -0.07556533813476562, -0.07300567626953125, -0.07044601440429688, -0.0678863525390625, -0.06532669067382812, -0.06276702880859375, -0.060207366943359375, -0.057647705078125, -0.055088043212890625, -0.05252838134765625, -0.049968719482421875, -0.0474090576171875, -0.044849395751953125, -0.04228973388671875, -0.039730072021484375, -0.03717041015625, -0.034610748291015625, -0.03205108642578125, -0.029491424560546875, -0.0269317626953125, -0.024372100830078125, -0.02181243896484375, -0.019252777099609375, -0.016693115234375, -0.014133453369140625, -0.01157379150390625, -0.009014129638671875, -0.0064544677734375, -0.003894805908203125, -0.00133514404296875, 0.001224517822265625, 0.0037841796875, 0.006343841552734375, 0.00890350341796875, 0.011463165283203125, 0.0140228271484375, 0.016582489013671875, 0.01914215087890625, 0.021701812744140625, 0.024261474609375, 0.026821136474609375, 0.02938079833984375, 0.031940460205078125, 0.0345001220703125, 0.037059783935546875, 0.03961944580078125, 0.042179107666015625, 0.04473876953125, 0.047298431396484375, 0.04985809326171875, 0.052417755126953125, 0.0549774169921875, 0.057537078857421875, 0.06009674072265625, 0.06265640258789062, 0.065216064453125, 0.06777572631835938, 0.07033538818359375, 0.07289505004882812, 0.0754547119140625, 0.07801437377929688, 0.08057403564453125, 0.08313369750976562, 0.085693359375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 8.0, 12.0, 5.0, 9.0, 15.0, 17.0, 23.0, 23.0, 21.0, 26.0, 47.0, 39.0, 40.0, 47.0, 47.0, 40.0, 44.0, 40.0, 57.0, 45.0, 36.0, 47.0, 38.0, 42.0, 38.0, 36.0, 22.0, 20.0, 17.0, 20.0, 23.0, 9.0, 14.0, 6.0, 9.0, 8.0, 3.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03509521484375, -0.03386974334716797, -0.03264427185058594, -0.031418800354003906, -0.030193328857421875, -0.028967857360839844, -0.027742385864257812, -0.02651691436767578, -0.02529144287109375, -0.02406597137451172, -0.022840499877929688, -0.021615028381347656, -0.020389556884765625, -0.019164085388183594, -0.017938613891601562, -0.01671314239501953, -0.0154876708984375, -0.014262199401855469, -0.013036727905273438, -0.011811256408691406, -0.010585784912109375, -0.009360313415527344, -0.008134841918945312, -0.006909370422363281, -0.00568389892578125, -0.004458427429199219, -0.0032329559326171875, -0.0020074844360351562, -0.000782012939453125, 0.00044345855712890625, 0.0016689300537109375, 0.0028944015502929688, 0.004119873046875, 0.005345344543457031, 0.0065708160400390625, 0.007796287536621094, 0.009021759033203125, 0.010247230529785156, 0.011472702026367188, 0.012698173522949219, 0.01392364501953125, 0.015149116516113281, 0.016374588012695312, 0.017600059509277344, 0.018825531005859375, 0.020051002502441406, 0.021276473999023438, 0.02250194549560547, 0.0237274169921875, 0.02495288848876953, 0.026178359985351562, 0.027403831481933594, 0.028629302978515625, 0.029854774475097656, 0.031080245971679688, 0.03230571746826172, 0.03353118896484375, 0.03475666046142578, 0.03598213195800781, 0.037207603454589844, 0.038433074951171875, 0.039658546447753906, 0.04088401794433594, 0.04210948944091797, 0.0433349609375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 11.0, 7.0, 17.0, 40.0, 48.0, 62.0, 74.0, 123.0, 186.0, 249.0, 438.0, 533.0, 841.0, 1306.0, 1989.0, 2909.0, 4535.0, 7092.0, 11114.0, 17610.0, 28868.0, 48486.0, 84748.0, 159931.0, 298170.0, 164124.0, 86200.0, 49848.0, 29272.0, 18036.0, 11147.0, 7075.0, 4539.0, 2949.0, 1961.0, 1268.0, 889.0, 594.0, 390.0, 249.0, 197.0, 132.0, 88.0, 67.0, 44.0, 30.0, 16.0, 13.0, 16.0, 7.0, 8.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.075439453125, -0.07304573059082031, -0.07065200805664062, -0.06825828552246094, -0.06586456298828125, -0.06347084045410156, -0.061077117919921875, -0.05868339538574219, -0.0562896728515625, -0.05389595031738281, -0.051502227783203125, -0.04910850524902344, -0.04671478271484375, -0.04432106018066406, -0.041927337646484375, -0.03953361511230469, -0.037139892578125, -0.03474617004394531, -0.032352447509765625, -0.029958724975585938, -0.02756500244140625, -0.025171279907226562, -0.022777557373046875, -0.020383834838867188, -0.0179901123046875, -0.015596389770507812, -0.013202667236328125, -0.010808944702148438, -0.00841522216796875, -0.0060214996337890625, -0.003627777099609375, -0.0012340545654296875, 0.00115966796875, 0.0035533905029296875, 0.005947113037109375, 0.008340835571289062, 0.01073455810546875, 0.013128280639648438, 0.015522003173828125, 0.017915725708007812, 0.0203094482421875, 0.022703170776367188, 0.025096893310546875, 0.027490615844726562, 0.02988433837890625, 0.03227806091308594, 0.034671783447265625, 0.03706550598144531, 0.039459228515625, 0.04185295104980469, 0.044246673583984375, 0.04664039611816406, 0.04903411865234375, 0.05142784118652344, 0.053821563720703125, 0.05621528625488281, 0.0586090087890625, 0.06100273132324219, 0.06339645385742188, 0.06579017639160156, 0.06818389892578125, 0.07057762145996094, 0.07297134399414062, 0.07536506652832031, 0.0777587890625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 2.0, 8.0, 10.0, 15.0, 17.0, 14.0, 19.0, 24.0, 23.0, 28.0, 33.0, 35.0, 33.0, 37.0, 36.0, 33.0, 51.0, 40.0, 36.0, 53.0, 37.0, 45.0, 46.0, 35.0, 31.0, 26.0, 31.0, 35.0, 22.0, 24.0, 20.0, 17.0, 15.0, 12.0, 10.0, 5.0, 9.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0229339599609375, -0.022221088409423828, -0.021508216857910156, -0.020795345306396484, -0.020082473754882812, -0.01936960220336914, -0.01865673065185547, -0.017943859100341797, -0.017230987548828125, -0.016518115997314453, -0.01580524444580078, -0.01509237289428711, -0.014379501342773438, -0.013666629791259766, -0.012953758239746094, -0.012240886688232422, -0.01152801513671875, -0.010815143585205078, -0.010102272033691406, -0.009389400482177734, -0.008676528930664062, -0.00796365737915039, -0.007250785827636719, -0.006537914276123047, -0.005825042724609375, -0.005112171173095703, -0.004399299621582031, -0.0036864280700683594, -0.0029735565185546875, -0.0022606849670410156, -0.0015478134155273438, -0.0008349418640136719, -0.0001220703125, 0.0005908012390136719, 0.0013036727905273438, 0.0020165443420410156, 0.0027294158935546875, 0.0034422874450683594, 0.004155158996582031, 0.004868030548095703, 0.005580902099609375, 0.006293773651123047, 0.007006645202636719, 0.007719516754150391, 0.008432388305664062, 0.009145259857177734, 0.009858131408691406, 0.010571002960205078, 0.01128387451171875, 0.011996746063232422, 0.012709617614746094, 0.013422489166259766, 0.014135360717773438, 0.01484823226928711, 0.015561103820800781, 0.016273975372314453, 0.016986846923828125, 0.017699718475341797, 0.01841259002685547, 0.01912546157836914, 0.019838333129882812, 0.020551204681396484, 0.021264076232910156, 0.021976947784423828, 0.0226898193359375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 3.0, 8.0, 10.0, 11.0, 15.0, 15.0, 18.0, 31.0, 63.0, 69.0, 90.0, 139.0, 217.0, 315.0, 578.0, 958.0, 1638.0, 2981.0, 5674.0, 12261.0, 37713.0, 853471.0, 96266.0, 18752.0, 7990.0, 4003.0, 2128.0, 1217.0, 687.0, 411.0, 237.0, 176.0, 131.0, 74.0, 58.0, 31.0, 27.0, 25.0, 17.0, 14.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.013458251953125, -0.013046979904174805, -0.01263570785522461, -0.012224435806274414, -0.011813163757324219, -0.011401891708374023, -0.010990619659423828, -0.010579347610473633, -0.010168075561523438, -0.009756803512573242, -0.009345531463623047, -0.008934259414672852, -0.008522987365722656, -0.008111715316772461, -0.007700443267822266, -0.00728917121887207, -0.006877899169921875, -0.00646662712097168, -0.006055355072021484, -0.005644083023071289, -0.005232810974121094, -0.0048215389251708984, -0.004410266876220703, -0.003998994827270508, -0.0035877227783203125, -0.003176450729370117, -0.002765178680419922, -0.0023539066314697266, -0.0019426345825195312, -0.001531362533569336, -0.0011200904846191406, -0.0007088184356689453, -0.00029754638671875, 0.00011372566223144531, 0.0005249977111816406, 0.0009362697601318359, 0.0013475418090820312, 0.0017588138580322266, 0.002170085906982422, 0.002581357955932617, 0.0029926300048828125, 0.003403902053833008, 0.003815174102783203, 0.0042264461517333984, 0.004637718200683594, 0.005048990249633789, 0.005460262298583984, 0.00587153434753418, 0.006282806396484375, 0.00669407844543457, 0.007105350494384766, 0.007516622543334961, 0.007927894592285156, 0.008339166641235352, 0.008750438690185547, 0.009161710739135742, 0.009572982788085938, 0.009984254837036133, 0.010395526885986328, 0.010806798934936523, 0.011218070983886719, 0.011629343032836914, 0.01204061508178711, 0.012451887130737305, 0.0128631591796875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 7.0, 0.0, 8.0, 0.0, 0.0, 13.0, 0.0, 19.0, 0.0, 34.0, 0.0, 57.0, 0.0, 0.0, 84.0, 0.0, 90.0, 0.0, 136.0, 0.0, 0.0, 117.0, 0.0, 132.0, 0.0, 111.0, 0.0, 68.0, 0.0, 0.0, 40.0, 0.0, 35.0, 0.0, 22.0, 0.0, 0.0, 14.0, 0.0, 13.0, 0.0, 7.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.083879947662354e-07, -7.82310962677002e-07, -7.562339305877686e-07, -7.301568984985352e-07, -7.040798664093018e-07, -6.780028343200684e-07, -6.51925802230835e-07, -6.258487701416016e-07, -5.997717380523682e-07, -5.736947059631348e-07, -5.476176738739014e-07, -5.21540641784668e-07, -4.954636096954346e-07, -4.6938657760620117e-07, -4.4330954551696777e-07, -4.172325134277344e-07, -3.91155481338501e-07, -3.650784492492676e-07, -3.390014171600342e-07, -3.129243850708008e-07, -2.868473529815674e-07, -2.60770320892334e-07, -2.3469328880310059e-07, -2.086162567138672e-07, -1.825392246246338e-07, -1.564621925354004e-07, -1.30385160446167e-07, -1.043081283569336e-07, -7.82310962677002e-08, -5.21540641784668e-08, -2.60770320892334e-08, 0.0, 2.60770320892334e-08, 5.21540641784668e-08, 7.82310962677002e-08, 1.043081283569336e-07, 1.30385160446167e-07, 1.564621925354004e-07, 1.825392246246338e-07, 2.086162567138672e-07, 2.3469328880310059e-07, 2.60770320892334e-07, 2.868473529815674e-07, 3.129243850708008e-07, 3.390014171600342e-07, 3.650784492492676e-07, 3.91155481338501e-07, 4.172325134277344e-07, 4.4330954551696777e-07, 4.6938657760620117e-07, 4.954636096954346e-07, 5.21540641784668e-07, 5.476176738739014e-07, 5.736947059631348e-07, 5.997717380523682e-07, 6.258487701416016e-07, 6.51925802230835e-07, 6.780028343200684e-07, 7.040798664093018e-07, 7.301568984985352e-07, 7.562339305877686e-07, 7.82310962677002e-07, 8.083879947662354e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 9.0, 7.0, 11.0, 15.0, 18.0, 33.0, 44.0, 56.0, 87.0, 101.0, 134.0, 220.0, 298.0, 478.0, 615.0, 940.0, 1346.0, 2043.0, 3231.0, 4785.0, 7955.0, 14835.0, 36676.0, 796691.0, 123561.0, 24026.0, 11539.0, 6445.0, 4089.0, 2732.0, 1707.0, 1133.0, 795.0, 592.0, 381.0, 262.0, 202.0, 140.0, 87.0, 72.0, 41.0, 39.0, 24.0, 14.0, 18.0, 10.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0111846923828125, -0.010833024978637695, -0.01048135757446289, -0.010129690170288086, -0.009778022766113281, -0.009426355361938477, -0.009074687957763672, -0.008723020553588867, -0.008371353149414062, -0.008019685745239258, -0.007668018341064453, -0.0073163509368896484, -0.006964683532714844, -0.006613016128540039, -0.006261348724365234, -0.00590968132019043, -0.005558013916015625, -0.00520634651184082, -0.004854679107666016, -0.004503011703491211, -0.004151344299316406, -0.0037996768951416016, -0.003448009490966797, -0.003096342086791992, -0.0027446746826171875, -0.002393007278442383, -0.002041339874267578, -0.0016896724700927734, -0.0013380050659179688, -0.000986337661743164, -0.0006346702575683594, -0.0002830028533935547, 6.866455078125e-05, 0.0004203319549560547, 0.0007719993591308594, 0.001123666763305664, 0.0014753341674804688, 0.0018270015716552734, 0.002178668975830078, 0.002530336380004883, 0.0028820037841796875, 0.003233671188354492, 0.003585338592529297, 0.0039370059967041016, 0.004288673400878906, 0.004640340805053711, 0.004992008209228516, 0.00534367561340332, 0.005695343017578125, 0.00604701042175293, 0.006398677825927734, 0.006750345230102539, 0.007102012634277344, 0.0074536800384521484, 0.007805347442626953, 0.008157014846801758, 0.008508682250976562, 0.008860349655151367, 0.009212017059326172, 0.009563684463500977, 0.009915351867675781, 0.010267019271850586, 0.01061868667602539, 0.010970354080200195, 0.011322021484375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 9.0, 9.0, 15.0, 30.0, 29.0, 74.0, 477.0, 200.0, 42.0, 19.0, 7.0, 10.0, 11.0, 5.0, 5.0, 7.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003452301025390625, -0.003343820571899414, -0.003235340118408203, -0.003126859664916992, -0.0030183792114257812, -0.0029098987579345703, -0.0028014183044433594, -0.0026929378509521484, -0.0025844573974609375, -0.0024759769439697266, -0.0023674964904785156, -0.0022590160369873047, -0.0021505355834960938, -0.002042055130004883, -0.0019335746765136719, -0.001825094223022461, -0.00171661376953125, -0.001608133316040039, -0.0014996528625488281, -0.0013911724090576172, -0.0012826919555664062, -0.0011742115020751953, -0.0010657310485839844, -0.0009572505950927734, -0.0008487701416015625, -0.0007402896881103516, -0.0006318092346191406, -0.0005233287811279297, -0.00041484832763671875, -0.0003063678741455078, -0.00019788742065429688, -8.940696716308594e-05, 1.9073486328125e-05, 0.00012755393981933594, 0.00023603439331054688, 0.0003445148468017578, 0.00045299530029296875, 0.0005614757537841797, 0.0006699562072753906, 0.0007784366607666016, 0.0008869171142578125, 0.0009953975677490234, 0.0011038780212402344, 0.0012123584747314453, 0.0013208389282226562, 0.0014293193817138672, 0.0015377998352050781, 0.001646280288696289, 0.0017547607421875, 0.001863241195678711, 0.001971721649169922, 0.002080202102661133, 0.0021886825561523438, 0.0022971630096435547, 0.0024056434631347656, 0.0025141239166259766, 0.0026226043701171875, 0.0027310848236083984, 0.0028395652770996094, 0.0029480457305908203, 0.0030565261840820312, 0.003165006637573242, 0.003273487091064453, 0.003381967544555664, 0.003490447998046875]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 0.0, 9.0, 7.0, 20.0, 11.0, 12.0, 26.0, 34.0, 59.0, 82.0, 105.0, 131.0, 145.0, 86.0, 71.0, 63.0, 37.0, 18.0, 21.0, 16.0, 12.0, 11.0, 11.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06294828653335571, -0.060916438698768616, -0.05888458713889122, -0.056852735579013824, -0.05482088774442673, -0.05278903990983963, -0.050757188349962234, -0.04872533679008484, -0.04669348895549774, -0.044661641120910645, -0.04262978956103325, -0.04059793800115585, -0.038566090166568756, -0.03653424233198166, -0.03450239077210426, -0.03247053921222687, -0.03043869137763977, -0.028406841680407524, -0.026374991983175278, -0.02434314228594303, -0.022311292588710785, -0.02027944289147854, -0.018247593194246292, -0.016215743497014046, -0.0141838937997818, -0.012152044102549553, -0.010120194405317307, -0.00808834470808506, -0.006056495010852814, -0.004024645313620567, -0.001992795616388321, 3.9054080843925476e-05, 0.002070896327495575, 0.004102746024727821, 0.006134595721960068, 0.008166445419192314, 0.01019829511642456, 0.012230144813656807, 0.014261994510889053, 0.0162938442081213, 0.018325693905353546, 0.020357543602585793, 0.02238939329981804, 0.024421242997050285, 0.026453092694282532, 0.028484942391514778, 0.030516792088747025, 0.03254864364862442, 0.03458049148321152, 0.036612339317798615, 0.03864419087767601, 0.040676042437553406, 0.0427078902721405, 0.0447397381067276, 0.046771589666604996, 0.04880344122648239, 0.05083528906106949, 0.052867136895656586, 0.05489898845553398, 0.05693084001541138, 0.058962687849998474, 0.06099453568458557, 0.06302638351917267, 0.06505823880434036, 0.06709008663892746]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 5.0, 10.0, 14.0, 19.0, 16.0, 19.0, 18.0, 27.0, 26.0, 28.0, 28.0, 42.0, 32.0, 37.0, 32.0, 37.0, 40.0, 35.0, 42.0, 38.0, 35.0, 35.0, 43.0, 35.0, 38.0, 34.0, 32.0, 20.0, 28.0, 27.0, 18.0, 15.0, 14.0, 17.0, 11.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032039523124694824, -0.030944867059588432, -0.02985021099448204, -0.02875555492937565, -0.027660898864269257, -0.026566242799162865, -0.025471586734056473, -0.02437693066895008, -0.02328227460384369, -0.022187618538737297, -0.021092962473630905, -0.019998306408524513, -0.01890365034341812, -0.01780899427831173, -0.016714338213205338, -0.015619682148098946, -0.014525026082992554, -0.013430370017886162, -0.01233571395277977, -0.011241057887673378, -0.010146401822566986, -0.009051745757460594, -0.007957089692354202, -0.00686243362724781, -0.0057677775621414185, -0.0046731214970350266, -0.0035784654319286346, -0.0024838093668222427, -0.0013891533017158508, -0.0002944972366094589, 0.000800158828496933, 0.0018948148936033249, 0.0029894746840000153, 0.004084130749106407, 0.005178786814212799, 0.006273442879319191, 0.007368098944425583, 0.008462755009531975, 0.009557411074638367, 0.010652067139744759, 0.01174672320485115, 0.012841379269957542, 0.013936035335063934, 0.015030691400170326, 0.016125347465276718, 0.01722000353038311, 0.018314659595489502, 0.019409315660595894, 0.020503971725702286, 0.021598627790808678, 0.02269328385591507, 0.02378793992102146, 0.024882595986127853, 0.025977252051234245, 0.027071908116340637, 0.02816656418144703, 0.02926122024655342, 0.030355876311659813, 0.031450532376766205, 0.03254518657922745, 0.03363984450697899, 0.03473450243473053, 0.03582915663719177, 0.036923810839653015, 0.038018468767404556]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 7.0, 14.0, 10.0, 25.0, 31.0, 39.0, 47.0, 70.0, 98.0, 134.0, 167.0, 226.0, 299.0, 358.0, 477.0, 695.0, 898.0, 1301.0, 1762.0, 2478.0, 3492.0, 4911.0, 7484.0, 11185.0, 16986.0, 26885.0, 43618.0, 75149.0, 137432.0, 316982.0, 1141802.0, 1558916.0, 440058.0, 172556.0, 88240.0, 49628.0, 29834.0, 18970.0, 12471.0, 8325.0, 5732.0, 4071.0, 2808.0, 2062.0, 1571.0, 1017.0, 785.0, 558.0, 422.0, 338.0, 244.0, 190.0, 134.0, 83.0, 68.0, 44.0, 44.0, 20.0, 20.0, 10.0, 12.0, 4.0], "bins": [-0.045074462890625, -0.04371452331542969, -0.042354583740234375, -0.04099464416503906, -0.03963470458984375, -0.03827476501464844, -0.036914825439453125, -0.03555488586425781, -0.0341949462890625, -0.03283500671386719, -0.031475067138671875, -0.030115127563476562, -0.02875518798828125, -0.027395248413085938, -0.026035308837890625, -0.024675369262695312, -0.0233154296875, -0.021955490112304688, -0.020595550537109375, -0.019235610961914062, -0.01787567138671875, -0.016515731811523438, -0.015155792236328125, -0.013795852661132812, -0.0124359130859375, -0.011075973510742188, -0.009716033935546875, -0.008356094360351562, -0.00699615478515625, -0.0056362152099609375, -0.004276275634765625, -0.0029163360595703125, -0.001556396484375, -0.0001964569091796875, 0.001163482666015625, 0.0025234222412109375, 0.00388336181640625, 0.0052433013916015625, 0.006603240966796875, 0.007963180541992188, 0.0093231201171875, 0.010683059692382812, 0.012042999267578125, 0.013402938842773438, 0.01476287841796875, 0.016122817993164062, 0.017482757568359375, 0.018842697143554688, 0.02020263671875, 0.021562576293945312, 0.022922515869140625, 0.024282455444335938, 0.02564239501953125, 0.027002334594726562, 0.028362274169921875, 0.029722213745117188, 0.0310821533203125, 0.03244209289550781, 0.033802032470703125, 0.03516197204589844, 0.03652191162109375, 0.03788185119628906, 0.039241790771484375, 0.04060173034667969, 0.041961669921875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 5.0, 4.0, 5.0, 9.0, 5.0, 11.0, 11.0, 12.0, 20.0, 22.0, 29.0, 25.0, 27.0, 36.0, 26.0, 38.0, 30.0, 31.0, 33.0, 40.0, 37.0, 60.0, 37.0, 35.0, 47.0, 48.0, 29.0, 44.0, 30.0, 31.0, 22.0, 22.0, 27.0, 20.0, 17.0, 16.0, 13.0, 10.0, 12.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0200042724609375, -0.019349336624145508, -0.018694400787353516, -0.018039464950561523, -0.01738452911376953, -0.01672959327697754, -0.016074657440185547, -0.015419721603393555, -0.014764785766601562, -0.01410984992980957, -0.013454914093017578, -0.012799978256225586, -0.012145042419433594, -0.011490106582641602, -0.01083517074584961, -0.010180234909057617, -0.009525299072265625, -0.008870363235473633, -0.00821542739868164, -0.0075604915618896484, -0.006905555725097656, -0.006250619888305664, -0.005595684051513672, -0.00494074821472168, -0.0042858123779296875, -0.0036308765411376953, -0.002975940704345703, -0.002321004867553711, -0.0016660690307617188, -0.0010111331939697266, -0.0003561973571777344, 0.0002987384796142578, 0.00095367431640625, 0.0016086101531982422, 0.0022635459899902344, 0.0029184818267822266, 0.0035734176635742188, 0.004228353500366211, 0.004883289337158203, 0.005538225173950195, 0.0061931610107421875, 0.00684809684753418, 0.007503032684326172, 0.008157968521118164, 0.008812904357910156, 0.009467840194702148, 0.01012277603149414, 0.010777711868286133, 0.011432647705078125, 0.012087583541870117, 0.01274251937866211, 0.013397455215454102, 0.014052391052246094, 0.014707326889038086, 0.015362262725830078, 0.01601719856262207, 0.016672134399414062, 0.017327070236206055, 0.017982006072998047, 0.01863694190979004, 0.01929187774658203, 0.019946813583374023, 0.020601749420166016, 0.021256685256958008, 0.02191162109375]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 10.0, 13.0, 22.0, 39.0, 64.0, 97.0, 176.0, 305.0, 545.0, 876.0, 1508.0, 2588.0, 4494.0, 7990.0, 15214.0, 29299.0, 61404.0, 138322.0, 364562.0, 1374201.0, 1524691.0, 390312.0, 147328.0, 64113.0, 30646.0, 15830.0, 8541.0, 4757.0, 2732.0, 1521.0, 845.0, 477.0, 274.0, 182.0, 109.0, 56.0, 42.0, 27.0, 32.0, 16.0, 9.0, 4.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.057952880859375, -0.05634450912475586, -0.05473613739013672, -0.05312776565551758, -0.05151939392089844, -0.0499110221862793, -0.048302650451660156, -0.046694278717041016, -0.045085906982421875, -0.043477535247802734, -0.041869163513183594, -0.04026079177856445, -0.03865242004394531, -0.03704404830932617, -0.03543567657470703, -0.03382730484008789, -0.03221893310546875, -0.03061056137084961, -0.02900218963623047, -0.027393817901611328, -0.025785446166992188, -0.024177074432373047, -0.022568702697753906, -0.020960330963134766, -0.019351959228515625, -0.017743587493896484, -0.016135215759277344, -0.014526844024658203, -0.012918472290039062, -0.011310100555419922, -0.009701728820800781, -0.00809335708618164, -0.0064849853515625, -0.004876613616943359, -0.0032682418823242188, -0.0016598701477050781, -5.14984130859375e-05, 0.0015568733215332031, 0.0031652450561523438, 0.004773616790771484, 0.006381988525390625, 0.007990360260009766, 0.009598731994628906, 0.011207103729248047, 0.012815475463867188, 0.014423847198486328, 0.01603221893310547, 0.01764059066772461, 0.01924896240234375, 0.02085733413696289, 0.02246570587158203, 0.024074077606201172, 0.025682449340820312, 0.027290821075439453, 0.028899192810058594, 0.030507564544677734, 0.032115936279296875, 0.033724308013916016, 0.035332679748535156, 0.0369410514831543, 0.03854942321777344, 0.04015779495239258, 0.04176616668701172, 0.04337453842163086, 0.04498291015625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 7.0, 9.0, 4.0, 9.0, 15.0, 14.0, 25.0, 26.0, 30.0, 32.0, 38.0, 46.0, 58.0, 87.0, 115.0, 123.0, 156.0, 176.0, 194.0, 242.0, 272.0, 362.0, 361.0, 280.0, 236.0, 217.0, 175.0, 157.0, 106.0, 118.0, 66.0, 62.0, 53.0, 34.0, 32.0, 30.0, 28.0, 18.0, 11.0, 10.0, 13.0, 3.0, 7.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.01300048828125, -0.012629032135009766, -0.012257575988769531, -0.011886119842529297, -0.011514663696289062, -0.011143207550048828, -0.010771751403808594, -0.01040029525756836, -0.010028839111328125, -0.00965738296508789, -0.009285926818847656, -0.008914470672607422, -0.008543014526367188, -0.008171558380126953, -0.007800102233886719, -0.007428646087646484, -0.00705718994140625, -0.006685733795166016, -0.006314277648925781, -0.005942821502685547, -0.0055713653564453125, -0.005199909210205078, -0.004828453063964844, -0.004456996917724609, -0.004085540771484375, -0.0037140846252441406, -0.0033426284790039062, -0.002971172332763672, -0.0025997161865234375, -0.002228260040283203, -0.0018568038940429688, -0.0014853477478027344, -0.0011138916015625, -0.0007424354553222656, -0.00037097930908203125, 4.76837158203125e-07, 0.0003719329833984375, 0.0007433891296386719, 0.0011148452758789062, 0.0014863014221191406, 0.001857757568359375, 0.0022292137145996094, 0.0026006698608398438, 0.002972126007080078, 0.0033435821533203125, 0.003715038299560547, 0.004086494445800781, 0.004457950592041016, 0.00482940673828125, 0.005200862884521484, 0.005572319030761719, 0.005943775177001953, 0.0063152313232421875, 0.006686687469482422, 0.007058143615722656, 0.007429599761962891, 0.007801055908203125, 0.00817251205444336, 0.008543968200683594, 0.008915424346923828, 0.009286880493164062, 0.009658336639404297, 0.010029792785644531, 0.010401248931884766, 0.010772705078125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 7.0, 5.0, 12.0, 19.0, 28.0, 30.0, 30.0, 56.0, 77.0, 90.0, 134.0, 117.0, 117.0, 60.0, 47.0, 41.0, 34.0, 24.0, 14.0, 17.0, 10.0, 7.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03981098160147667, -0.038569264113903046, -0.03732754662632942, -0.0360858291387558, -0.034844111651182175, -0.03360239416360855, -0.03236067667603493, -0.031118961051106453, -0.02987724356353283, -0.028635526075959206, -0.027393808588385582, -0.02615209110081196, -0.024910375475883484, -0.02366865798830986, -0.022426940500736237, -0.021185223013162613, -0.01994350552558899, -0.018701788038015366, -0.017460070550441742, -0.01621835306286812, -0.01497663650661707, -0.013734919019043446, -0.012493202462792397, -0.011251484975218773, -0.01000976748764515, -0.008768050000071526, -0.007526332978159189, -0.006284615956246853, -0.005042898468673229, -0.0038011809810996056, -0.002559463959187269, -0.0013177469372749329, -7.60294497013092e-05, 0.0011656878050416708, 0.002407405059784651, 0.003649122314527631, 0.004890839569270611, 0.0061325570568442345, 0.007374274078756571, 0.008615991100668907, 0.00985770858824253, 0.011099426075816154, 0.012341143563389778, 0.013582860119640827, 0.01482457760721445, 0.0160662941634655, 0.017308011651039124, 0.018549729138612747, 0.01979144662618637, 0.021033164113759995, 0.022274881601333618, 0.023516599088907242, 0.024758316576480865, 0.02600003406405449, 0.027241749688982964, 0.028483467176556587, 0.02972518466413021, 0.030966902151703835, 0.03220861777663231, 0.03345033526420593, 0.034692052751779556, 0.03593377023935318, 0.037175487726926804, 0.03841720521450043, 0.03965892270207405]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 7.0, 10.0, 12.0, 13.0, 13.0, 14.0, 17.0, 20.0, 21.0, 21.0, 27.0, 32.0, 38.0, 26.0, 36.0, 23.0, 36.0, 42.0, 39.0, 33.0, 30.0, 26.0, 42.0, 42.0, 30.0, 31.0, 27.0, 26.0, 35.0, 32.0, 22.0, 29.0, 25.0, 12.0, 20.0, 14.0, 11.0, 12.0, 13.0, 9.0, 5.0, 3.0, 8.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.018741626292467117, -0.018107404932379723, -0.017473183572292328, -0.016838964074850082, -0.016204742714762688, -0.015570521354675293, -0.014936300925910473, -0.014302080497145653, -0.013667859137058258, -0.013033637776970863, -0.012399417348206043, -0.011765196919441223, -0.011130975559353828, -0.010496754199266434, -0.009862533770501614, -0.009228313341736794, -0.008594091981649399, -0.007959870621562004, -0.007325650192797184, -0.006691429298371077, -0.006057208403944969, -0.005422987509518862, -0.004788766615092754, -0.004154545720666647, -0.0035203248262405396, -0.002886103931814432, -0.0022518830373883247, -0.0016176621429622173, -0.00098344124853611, -0.0003492203541100025, 0.0002850005403161049, 0.0009192214347422123, 0.0015534404665231705, 0.002187661360949278, 0.0028218822553753853, 0.0034561031498014927, 0.0040903240442276, 0.0047245449386537075, 0.005358765833079815, 0.005992986727505922, 0.00662720762193203, 0.007261428516358137, 0.007895649410784245, 0.008529869839549065, 0.00916409119963646, 0.009798312559723854, 0.010432532988488674, 0.011066753417253494, 0.011700974777340889, 0.012335196137428284, 0.012969416566193104, 0.013603636994957924, 0.014237858355045319, 0.014872079715132713, 0.015506300143897533, 0.016140520572662354, 0.016774741932749748, 0.017408963292837143, 0.01804318279027939, 0.018677404150366783, 0.019311625510454178, 0.019945846870541573, 0.020580068230628967, 0.021214287728071213, 0.021848509088158607]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 2.0, 8.0, 15.0, 16.0, 24.0, 45.0, 61.0, 84.0, 123.0, 178.0, 251.0, 374.0, 567.0, 872.0, 1421.0, 2206.0, 3529.0, 5750.0, 9794.0, 16791.0, 29748.0, 56770.0, 121922.0, 312605.0, 265461.0, 104680.0, 50430.0, 26820.0, 14940.0, 8727.0, 5197.0, 3211.0, 2051.0, 1330.0, 841.0, 552.0, 419.0, 217.0, 165.0, 108.0, 63.0, 56.0, 40.0, 38.0, 25.0, 3.0, 16.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0081024169921875, -0.007840275764465332, -0.007578134536743164, -0.007315993309020996, -0.007053852081298828, -0.00679171085357666, -0.006529569625854492, -0.006267428398132324, -0.006005287170410156, -0.005743145942687988, -0.00548100471496582, -0.005218863487243652, -0.004956722259521484, -0.004694581031799316, -0.0044324398040771484, -0.0041702985763549805, -0.0039081573486328125, -0.0036460161209106445, -0.0033838748931884766, -0.0031217336654663086, -0.0028595924377441406, -0.0025974512100219727, -0.0023353099822998047, -0.0020731687545776367, -0.0018110275268554688, -0.0015488862991333008, -0.0012867450714111328, -0.0010246038436889648, -0.0007624626159667969, -0.0005003213882446289, -0.00023818016052246094, 2.396106719970703e-05, 0.000286102294921875, 0.000548243522644043, 0.0008103847503662109, 0.001072525978088379, 0.0013346672058105469, 0.0015968084335327148, 0.0018589496612548828, 0.0021210908889770508, 0.0023832321166992188, 0.0026453733444213867, 0.0029075145721435547, 0.0031696557998657227, 0.0034317970275878906, 0.0036939382553100586, 0.0039560794830322266, 0.0042182207107543945, 0.0044803619384765625, 0.0047425031661987305, 0.0050046443939208984, 0.005266785621643066, 0.005528926849365234, 0.005791068077087402, 0.00605320930480957, 0.006315350532531738, 0.006577491760253906, 0.006839632987976074, 0.007101774215698242, 0.00736391544342041, 0.007626056671142578, 0.007888197898864746, 0.008150339126586914, 0.008412480354309082, 0.00867462158203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 12.0, 11.0, 12.0, 11.0, 14.0, 15.0, 17.0, 23.0, 26.0, 32.0, 30.0, 47.0, 23.0, 26.0, 40.0, 40.0, 36.0, 42.0, 30.0, 35.0, 39.0, 46.0, 29.0, 34.0, 40.0, 27.0, 29.0, 30.0, 26.0, 31.0, 23.0, 17.0, 11.0, 16.0, 13.0, 10.0, 8.0, 12.0, 3.0, 6.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021148681640625, -0.020461320877075195, -0.01977396011352539, -0.019086599349975586, -0.01839923858642578, -0.017711877822875977, -0.017024517059326172, -0.016337156295776367, -0.015649795532226562, -0.014962434768676758, -0.014275074005126953, -0.013587713241577148, -0.012900352478027344, -0.012212991714477539, -0.011525630950927734, -0.01083827018737793, -0.010150909423828125, -0.00946354866027832, -0.008776187896728516, -0.008088827133178711, -0.007401466369628906, -0.0067141056060791016, -0.006026744842529297, -0.005339384078979492, -0.0046520233154296875, -0.003964662551879883, -0.003277301788330078, -0.0025899410247802734, -0.0019025802612304688, -0.001215219497680664, -0.0005278587341308594, 0.0001595020294189453, 0.00084686279296875, 0.0015342235565185547, 0.0022215843200683594, 0.002908945083618164, 0.0035963058471679688, 0.0042836666107177734, 0.004971027374267578, 0.005658388137817383, 0.0063457489013671875, 0.007033109664916992, 0.007720470428466797, 0.008407831192016602, 0.009095191955566406, 0.009782552719116211, 0.010469913482666016, 0.01115727424621582, 0.011844635009765625, 0.01253199577331543, 0.013219356536865234, 0.013906717300415039, 0.014594078063964844, 0.015281438827514648, 0.015968799591064453, 0.016656160354614258, 0.017343521118164062, 0.018030881881713867, 0.018718242645263672, 0.019405603408813477, 0.02009296417236328, 0.020780324935913086, 0.02146768569946289, 0.022155046463012695, 0.0228424072265625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 7.0, 6.0, 10.0, 5.0, 18.0, 18.0, 31.0, 56.0, 44.0, 64.0, 127.0, 168.0, 210.0, 312.0, 450.0, 679.0, 1031.0, 1484.0, 2293.0, 3653.0, 5821.0, 9826.0, 17156.0, 31753.0, 65354.0, 171473.0, 450187.0, 153897.0, 60776.0, 30080.0, 16269.0, 9334.0, 5673.0, 3478.0, 2221.0, 1520.0, 952.0, 694.0, 447.0, 304.0, 202.0, 144.0, 117.0, 64.0, 51.0, 28.0, 22.0, 16.0, 14.0, 10.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.010772705078125, -0.010430216789245605, -0.010087728500366211, -0.009745240211486816, -0.009402751922607422, -0.009060263633728027, -0.008717775344848633, -0.008375287055969238, -0.008032798767089844, -0.007690310478210449, -0.007347822189331055, -0.00700533390045166, -0.006662845611572266, -0.006320357322692871, -0.0059778690338134766, -0.005635380744934082, -0.0052928924560546875, -0.004950404167175293, -0.0046079158782958984, -0.004265427589416504, -0.003922939300537109, -0.003580451011657715, -0.0032379627227783203, -0.0028954744338989258, -0.0025529861450195312, -0.0022104978561401367, -0.0018680095672607422, -0.0015255212783813477, -0.0011830329895019531, -0.0008405447006225586, -0.0004980564117431641, -0.00015556812286376953, 0.000186920166015625, 0.0005294084548950195, 0.0008718967437744141, 0.0012143850326538086, 0.0015568733215332031, 0.0018993616104125977, 0.002241849899291992, 0.0025843381881713867, 0.0029268264770507812, 0.0032693147659301758, 0.0036118030548095703, 0.003954291343688965, 0.004296779632568359, 0.004639267921447754, 0.0049817562103271484, 0.005324244499206543, 0.0056667327880859375, 0.006009221076965332, 0.0063517093658447266, 0.006694197654724121, 0.007036685943603516, 0.00737917423248291, 0.007721662521362305, 0.0080641508102417, 0.008406639099121094, 0.008749127388000488, 0.009091615676879883, 0.009434103965759277, 0.009776592254638672, 0.010119080543518066, 0.010461568832397461, 0.010804057121276855, 0.01114654541015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 17.0, 19.0, 10.0, 23.0, 22.0, 35.0, 31.0, 44.0, 39.0, 48.0, 48.0, 42.0, 56.0, 44.0, 51.0, 48.0, 52.0, 46.0, 38.0, 33.0, 27.0, 25.0, 28.0, 22.0, 18.0, 27.0, 23.0, 14.0, 14.0, 11.0, 6.0, 1.0, 9.0, 4.0, 2.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.017822265625, -0.017313003540039062, -0.016803741455078125, -0.016294479370117188, -0.01578521728515625, -0.015275955200195312, -0.014766693115234375, -0.014257431030273438, -0.0137481689453125, -0.013238906860351562, -0.012729644775390625, -0.012220382690429688, -0.01171112060546875, -0.011201858520507812, -0.010692596435546875, -0.010183334350585938, -0.009674072265625, -0.009164810180664062, -0.008655548095703125, -0.008146286010742188, -0.00763702392578125, -0.0071277618408203125, -0.006618499755859375, -0.0061092376708984375, -0.0055999755859375, -0.0050907135009765625, -0.004581451416015625, -0.0040721893310546875, -0.00356292724609375, -0.0030536651611328125, -0.002544403076171875, -0.0020351409912109375, -0.00152587890625, -0.0010166168212890625, -0.000507354736328125, 1.9073486328125e-06, 0.00051116943359375, 0.0010204315185546875, 0.001529693603515625, 0.0020389556884765625, 0.0025482177734375, 0.0030574798583984375, 0.003566741943359375, 0.0040760040283203125, 0.00458526611328125, 0.0050945281982421875, 0.005603790283203125, 0.0061130523681640625, 0.006622314453125, 0.0071315765380859375, 0.007640838623046875, 0.008150100708007812, 0.00865936279296875, 0.009168624877929688, 0.009677886962890625, 0.010187149047851562, 0.0106964111328125, 0.011205673217773438, 0.011714935302734375, 0.012224197387695312, 0.01273345947265625, 0.013242721557617188, 0.013751983642578125, 0.014261245727539062, 0.0147705078125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 9.0, 12.0, 19.0, 24.0, 36.0, 35.0, 43.0, 71.0, 109.0, 170.0, 207.0, 308.0, 433.0, 652.0, 1064.0, 1581.0, 2566.0, 4479.0, 8108.0, 16407.0, 40814.0, 167793.0, 662831.0, 85304.0, 27429.0, 12020.0, 6278.0, 3554.0, 2219.0, 1313.0, 853.0, 588.0, 391.0, 226.0, 169.0, 122.0, 84.0, 62.0, 42.0, 39.0, 29.0, 15.0, 11.0, 5.0, 5.0, 1.0, 8.0, 9.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0008821487426757812, -0.000850975513458252, -0.0008198022842407227, -0.0007886290550231934, -0.0007574558258056641, -0.0007262825965881348, -0.0006951093673706055, -0.0006639361381530762, -0.0006327629089355469, -0.0006015896797180176, -0.0005704164505004883, -0.000539243221282959, -0.0005080699920654297, -0.0004768967628479004, -0.0004457235336303711, -0.0004145503044128418, -0.0003833770751953125, -0.0003522038459777832, -0.0003210306167602539, -0.0002898573875427246, -0.0002586841583251953, -0.00022751092910766602, -0.00019633769989013672, -0.00016516447067260742, -0.00013399124145507812, -0.00010281801223754883, -7.164478302001953e-05, -4.0471553802490234e-05, -9.298324584960938e-06, 2.187490463256836e-05, 5.3048133850097656e-05, 8.422136306762695e-05, 0.00011539459228515625, 0.00014656782150268555, 0.00017774105072021484, 0.00020891427993774414, 0.00024008750915527344, 0.00027126073837280273, 0.00030243396759033203, 0.00033360719680786133, 0.0003647804260253906, 0.0003959536552429199, 0.0004271268844604492, 0.0004583001136779785, 0.0004894733428955078, 0.0005206465721130371, 0.0005518198013305664, 0.0005829930305480957, 0.000614166259765625, 0.0006453394889831543, 0.0006765127182006836, 0.0007076859474182129, 0.0007388591766357422, 0.0007700324058532715, 0.0008012056350708008, 0.0008323788642883301, 0.0008635520935058594, 0.0008947253227233887, 0.000925898551940918, 0.0009570717811584473, 0.0009882450103759766, 0.0010194182395935059, 0.0010505914688110352, 0.0010817646980285645, 0.0011129379272460938]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 7.0, 14.0, 8.0, 0.0, 13.0, 27.0, 20.0, 38.0, 0.0, 52.0, 60.0, 67.0, 75.0, 0.0, 89.0, 102.0, 85.0, 88.0, 0.0, 56.0, 54.0, 34.0, 21.0, 0.0, 18.0, 28.0, 16.0, 5.0, 0.0, 11.0, 5.0, 2.0, 4.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2042000889778137e-06, -1.1567026376724243e-06, -1.109205186367035e-06, -1.0617077350616455e-06, -1.014210283756256e-06, -9.667128324508667e-07, -9.192153811454773e-07, -8.717179298400879e-07, -8.242204785346985e-07, -7.767230272293091e-07, -7.292255759239197e-07, -6.817281246185303e-07, -6.342306733131409e-07, -5.867332220077515e-07, -5.392357707023621e-07, -4.917383193969727e-07, -4.4424086809158325e-07, -3.9674341678619385e-07, -3.4924596548080444e-07, -3.0174851417541504e-07, -2.5425106287002563e-07, -2.0675361156463623e-07, -1.5925616025924683e-07, -1.1175870895385742e-07, -6.426125764846802e-08, -1.6763806343078613e-08, 3.073364496231079e-08, 7.82310962677002e-08, 1.257285475730896e-07, 1.73225998878479e-07, 2.207234501838684e-07, 2.682209014892578e-07, 3.157183527946472e-07, 3.632158041000366e-07, 4.10713255405426e-07, 4.5821070671081543e-07, 5.057081580162048e-07, 5.532056093215942e-07, 6.007030606269836e-07, 6.48200511932373e-07, 6.956979632377625e-07, 7.431954145431519e-07, 7.906928658485413e-07, 8.381903171539307e-07, 8.856877684593201e-07, 9.331852197647095e-07, 9.806826710700989e-07, 1.0281801223754883e-06, 1.0756775736808777e-06, 1.123175024986267e-06, 1.1706724762916565e-06, 1.218169927597046e-06, 1.2656673789024353e-06, 1.3131648302078247e-06, 1.3606622815132141e-06, 1.4081597328186035e-06, 1.455657184123993e-06, 1.5031546354293823e-06, 1.5506520867347717e-06, 1.5981495380401611e-06, 1.6456469893455505e-06, 1.69314444065094e-06, 1.7406418919563293e-06, 1.7881393432617188e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 9.0, 7.0, 9.0, 25.0, 25.0, 32.0, 57.0, 95.0, 124.0, 205.0, 284.0, 413.0, 628.0, 1032.0, 1806.0, 3042.0, 5589.0, 11979.0, 29091.0, 93561.0, 614812.0, 201313.0, 48559.0, 17890.0, 7922.0, 4048.0, 2257.0, 1327.0, 869.0, 507.0, 371.0, 194.0, 152.0, 98.0, 80.0, 49.0, 32.0, 20.0, 14.0, 16.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012159347534179688, -0.0011750459671020508, -0.0011341571807861328, -0.0010932683944702148, -0.0010523796081542969, -0.001011490821838379, -0.0009706020355224609, -0.000929713249206543, -0.000888824462890625, -0.000847935676574707, -0.0008070468902587891, -0.0007661581039428711, -0.0007252693176269531, -0.0006843805313110352, -0.0006434917449951172, -0.0006026029586791992, -0.0005617141723632812, -0.0005208253860473633, -0.0004799365997314453, -0.00043904781341552734, -0.0003981590270996094, -0.0003572702407836914, -0.00031638145446777344, -0.00027549266815185547, -0.0002346038818359375, -0.00019371509552001953, -0.00015282630920410156, -0.0001119375228881836, -7.104873657226562e-05, -3.0159950256347656e-05, 1.0728836059570312e-05, 5.161762237548828e-05, 9.250640869140625e-05, 0.00013339519500732422, 0.0001742839813232422, 0.00021517276763916016, 0.0002560615539550781, 0.0002969503402709961, 0.00033783912658691406, 0.00037872791290283203, 0.00041961669921875, 0.00046050548553466797, 0.0005013942718505859, 0.0005422830581665039, 0.0005831718444824219, 0.0006240606307983398, 0.0006649494171142578, 0.0007058382034301758, 0.0007467269897460938, 0.0007876157760620117, 0.0008285045623779297, 0.0008693933486938477, 0.0009102821350097656, 0.0009511709213256836, 0.0009920597076416016, 0.0010329484939575195, 0.0010738372802734375, 0.0011147260665893555, 0.0011556148529052734, 0.0011965036392211914, 0.0012373924255371094, 0.0012782812118530273, 0.0013191699981689453, 0.0013600587844848633, 0.0014009475708007812]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 5.0, 9.0, 4.0, 7.0, 12.0, 16.0, 21.0, 25.0, 42.0, 44.0, 91.0, 181.0, 227.0, 92.0, 56.0, 44.0, 25.0, 19.0, 9.0, 11.0, 11.0, 12.0, 5.0, 2.0, 4.0, 6.0, 1.0, 7.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004661083221435547, -0.0004528351128101349, -0.0004395619034767151, -0.0004262886941432953, -0.0004130154848098755, -0.0003997422754764557, -0.0003864690661430359, -0.0003731958568096161, -0.0003599226474761963, -0.0003466494381427765, -0.0003333762288093567, -0.0003201030194759369, -0.0003068298101425171, -0.0002935566008090973, -0.0002802833914756775, -0.0002670101821422577, -0.0002537369728088379, -0.0002404637634754181, -0.0002271905541419983, -0.0002139173448085785, -0.0002006441354751587, -0.0001873709261417389, -0.0001740977168083191, -0.0001608245074748993, -0.0001475512981414795, -0.0001342780888080597, -0.00012100487947463989, -0.00010773167014122009, -9.445846080780029e-05, -8.118525147438049e-05, -6.79120421409607e-05, -5.4638832807540894e-05, -4.1365623474121094e-05, -2.8092414140701294e-05, -1.4819204807281494e-05, -1.5459954738616943e-06, 1.1727213859558105e-05, 2.5000423192977905e-05, 3.8273632526397705e-05, 5.1546841859817505e-05, 6.48200511932373e-05, 7.80932605266571e-05, 9.13664698600769e-05, 0.0001046396791934967, 0.0001179128885269165, 0.0001311860978603363, 0.0001444593071937561, 0.0001577325165271759, 0.0001710057258605957, 0.0001842789351940155, 0.0001975521445274353, 0.0002108253538608551, 0.0002240985631942749, 0.0002373717725276947, 0.0002506449818611145, 0.0002639181911945343, 0.0002771914005279541, 0.0002904646098613739, 0.0003037378191947937, 0.0003170110285282135, 0.0003302842378616333, 0.0003435574471950531, 0.0003568306565284729, 0.0003701038658618927, 0.0003833770751953125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 15.0, 13.0, 27.0, 28.0, 40.0, 51.0, 80.0, 85.0, 132.0, 127.0, 107.0, 67.0, 47.0, 32.0, 38.0, 24.0, 18.0, 15.0, 7.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039350349456071854, -0.03812248259782791, -0.03689461573958397, -0.035666752606630325, -0.03443888574838638, -0.03321101889014244, -0.0319831520318985, -0.030755285173654556, -0.029527420178055763, -0.02829955331981182, -0.027071688324213028, -0.025843821465969086, -0.024615954607725143, -0.02338808961212635, -0.022160222753882408, -0.020932357758283615, -0.019704490900039673, -0.01847662404179573, -0.017248759046196938, -0.016020892187952995, -0.014793026261031628, -0.01356516033411026, -0.012337293475866318, -0.01110942754894495, -0.009881561622023582, -0.008653695695102215, -0.00742582930251956, -0.006197962909936905, -0.004970096983015537, -0.0037422310560941696, -0.0025143646635115147, -0.0012864982709288597, -5.8628618717193604e-05, 0.0011692375410348177, 0.002397103700786829, 0.0036249698605388403, 0.004852836020290852, 0.006080701947212219, 0.007308568339794874, 0.00853643473237753, 0.009764300659298897, 0.010992166586220264, 0.012220032513141632, 0.013447899371385574, 0.014675765298306942, 0.01590363122522831, 0.017131498083472252, 0.018359363079071045, 0.019587229937314987, 0.02081509679555893, 0.022042961791157722, 0.023270828649401665, 0.024498693645000458, 0.0257265605032444, 0.026954427361488342, 0.028182294219732285, 0.029410159215331078, 0.03063802607357502, 0.03186589106917381, 0.033093757927417755, 0.0343216247856617, 0.03554949164390564, 0.03677735477685928, 0.038005221635103226, 0.03923308849334717]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 5.0, 2.0, 7.0, 10.0, 12.0, 14.0, 13.0, 14.0, 15.0, 21.0, 23.0, 23.0, 24.0, 32.0, 39.0, 28.0, 34.0, 23.0, 35.0, 40.0, 38.0, 37.0, 26.0, 30.0, 40.0, 40.0, 32.0, 31.0, 29.0, 26.0, 34.0, 31.0, 22.0, 30.0, 24.0, 11.0, 20.0, 17.0, 9.0, 13.0, 11.0, 10.0, 5.0, 3.0, 8.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01852143369615078, -0.017891794443130493, -0.017262155190110207, -0.01663251593708992, -0.016002876684069633, -0.015373237431049347, -0.014743597246706486, -0.0141139579936862, -0.013484318740665913, -0.012854679487645626, -0.01222504023462534, -0.011595400981605053, -0.010965760797262192, -0.010336121544241905, -0.009706482291221619, -0.009076843038201332, -0.008447203785181046, -0.007817564532160759, -0.007187925279140472, -0.0065582855604588985, -0.005928646307438612, -0.005299007054418325, -0.0046693673357367516, -0.004039728082716465, -0.0034100888296961784, -0.002780449576675892, -0.0021508100908249617, -0.0015211707213893533, -0.0008915313519537449, -0.00026189209893345833, 0.0003677473869174719, 0.000997386872768402, 0.0016270279884338379, 0.0022566672414541245, 0.0028863067273050547, 0.003515946213155985, 0.0041455854661762714, 0.004775224719196558, 0.005404864437878132, 0.006034503690898418, 0.006664142943918705, 0.0072937821969389915, 0.007923421449959278, 0.008553060702979565, 0.009182700887322426, 0.009812340140342712, 0.010441979393362999, 0.011071618646383286, 0.011701257899403572, 0.012330897152423859, 0.012960536405444145, 0.013590175658464432, 0.014219814911484718, 0.014849454164505005, 0.015479094348847866, 0.016108732670545578, 0.016738373786211014, 0.0173680130392313, 0.017997652292251587, 0.018627291545271873, 0.01925693079829216, 0.019886570051312447, 0.020516209304332733, 0.02114585041999817, 0.021775487810373306]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 12.0, 14.0, 19.0, 42.0, 42.0, 79.0, 129.0, 157.0, 220.0, 332.0, 537.0, 721.0, 1026.0, 1526.0, 2034.0, 3021.0, 4281.0, 6284.0, 9379.0, 13556.0, 20972.0, 32320.0, 52223.0, 87046.0, 152782.0, 245589.0, 165058.0, 92300.0, 54961.0, 34238.0, 21815.0, 14547.0, 9776.0, 6572.0, 4546.0, 3245.0, 2231.0, 1495.0, 1030.0, 720.0, 519.0, 405.0, 253.0, 173.0, 100.0, 83.0, 39.0, 35.0, 27.0, 16.0, 14.0, 5.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.04071044921875, -0.03949737548828125, -0.0382843017578125, -0.03707122802734375, -0.035858154296875, -0.03464508056640625, -0.0334320068359375, -0.03221893310546875, -0.031005859375, -0.02979278564453125, -0.0285797119140625, -0.02736663818359375, -0.026153564453125, -0.02494049072265625, -0.0237274169921875, -0.02251434326171875, -0.02130126953125, -0.02008819580078125, -0.0188751220703125, -0.01766204833984375, -0.016448974609375, -0.01523590087890625, -0.0140228271484375, -0.01280975341796875, -0.0115966796875, -0.01038360595703125, -0.0091705322265625, -0.00795745849609375, -0.006744384765625, -0.00553131103515625, -0.0043182373046875, -0.00310516357421875, -0.00189208984375, -0.00067901611328125, 0.0005340576171875, 0.00174713134765625, 0.002960205078125, 0.00417327880859375, 0.0053863525390625, 0.00659942626953125, 0.0078125, 0.00902557373046875, 0.0102386474609375, 0.01145172119140625, 0.012664794921875, 0.01387786865234375, 0.0150909423828125, 0.01630401611328125, 0.01751708984375, 0.01873016357421875, 0.0199432373046875, 0.02115631103515625, 0.022369384765625, 0.02358245849609375, 0.0247955322265625, 0.02600860595703125, 0.0272216796875, 0.02843475341796875, 0.0296478271484375, 0.03086090087890625, 0.032073974609375, 0.03328704833984375, 0.0345001220703125, 0.03571319580078125, 0.03692626953125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 13.0, 14.0, 18.0, 16.0, 19.0, 19.0, 31.0, 26.0, 24.0, 29.0, 30.0, 29.0, 44.0, 30.0, 49.0, 36.0, 29.0, 41.0, 38.0, 45.0, 48.0, 39.0, 32.0, 20.0, 37.0, 31.0, 25.0, 26.0, 17.0, 19.0, 20.0, 9.0, 11.0, 12.0, 12.0, 6.0, 6.0, 5.0, 7.0, 9.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0166015625, -0.01603102684020996, -0.015460491180419922, -0.014889955520629883, -0.014319419860839844, -0.013748884201049805, -0.013178348541259766, -0.012607812881469727, -0.012037277221679688, -0.011466741561889648, -0.01089620590209961, -0.01032567024230957, -0.009755134582519531, -0.009184598922729492, -0.008614063262939453, -0.008043527603149414, -0.007472991943359375, -0.006902456283569336, -0.006331920623779297, -0.005761384963989258, -0.005190849304199219, -0.00462031364440918, -0.004049777984619141, -0.0034792423248291016, -0.0029087066650390625, -0.0023381710052490234, -0.0017676353454589844, -0.0011970996856689453, -0.0006265640258789062, -5.602836608886719e-05, 0.0005145072937011719, 0.001085042953491211, 0.00165557861328125, 0.002226114273071289, 0.002796649932861328, 0.003367185592651367, 0.003937721252441406, 0.004508256912231445, 0.005078792572021484, 0.0056493282318115234, 0.0062198638916015625, 0.0067903995513916016, 0.007360935211181641, 0.00793147087097168, 0.008502006530761719, 0.009072542190551758, 0.009643077850341797, 0.010213613510131836, 0.010784149169921875, 0.011354684829711914, 0.011925220489501953, 0.012495756149291992, 0.013066291809082031, 0.01363682746887207, 0.01420736312866211, 0.014777898788452148, 0.015348434448242188, 0.015918970108032227, 0.016489505767822266, 0.017060041427612305, 0.017630577087402344, 0.018201112747192383, 0.018771648406982422, 0.01934218406677246, 0.0199127197265625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 15.0, 11.0, 12.0, 30.0, 36.0, 54.0, 76.0, 126.0, 194.0, 278.0, 499.0, 790.0, 1367.0, 2086.0, 3453.0, 5670.0, 9546.0, 16148.0, 27558.0, 48540.0, 88511.0, 171540.0, 308674.0, 164885.0, 85086.0, 47242.0, 26823.0, 15620.0, 9260.0, 5608.0, 3411.0, 2056.0, 1226.0, 809.0, 481.0, 322.0, 195.0, 107.0, 81.0, 55.0, 28.0, 21.0, 10.0, 6.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042694091796875, -0.041245460510253906, -0.03979682922363281, -0.03834819793701172, -0.036899566650390625, -0.03545093536376953, -0.03400230407714844, -0.032553672790527344, -0.03110504150390625, -0.029656410217285156, -0.028207778930664062, -0.02675914764404297, -0.025310516357421875, -0.02386188507080078, -0.022413253784179688, -0.020964622497558594, -0.0195159912109375, -0.018067359924316406, -0.016618728637695312, -0.015170097351074219, -0.013721466064453125, -0.012272834777832031, -0.010824203491210938, -0.009375572204589844, -0.00792694091796875, -0.006478309631347656, -0.0050296783447265625, -0.0035810470581054688, -0.002132415771484375, -0.0006837844848632812, 0.0007648468017578125, 0.0022134780883789062, 0.003662109375, 0.005110740661621094, 0.0065593719482421875, 0.008008003234863281, 0.009456634521484375, 0.010905265808105469, 0.012353897094726562, 0.013802528381347656, 0.01525115966796875, 0.016699790954589844, 0.018148422241210938, 0.01959705352783203, 0.021045684814453125, 0.02249431610107422, 0.023942947387695312, 0.025391578674316406, 0.0268402099609375, 0.028288841247558594, 0.029737472534179688, 0.03118610382080078, 0.032634735107421875, 0.03408336639404297, 0.03553199768066406, 0.036980628967285156, 0.03842926025390625, 0.039877891540527344, 0.04132652282714844, 0.04277515411376953, 0.044223785400390625, 0.04567241668701172, 0.04712104797363281, 0.048569679260253906, 0.050018310546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 7.0, 5.0, 10.0, 11.0, 12.0, 21.0, 15.0, 18.0, 21.0, 20.0, 24.0, 17.0, 32.0, 31.0, 27.0, 30.0, 34.0, 29.0, 32.0, 36.0, 47.0, 33.0, 55.0, 50.0, 34.0, 42.0, 33.0, 28.0, 27.0, 27.0, 28.0, 19.0, 16.0, 22.0, 19.0, 16.0, 10.0, 11.0, 8.0, 6.0, 15.0, 5.0, 7.0, 2.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.01187896728515625, -0.011524677276611328, -0.011170387268066406, -0.010816097259521484, -0.010461807250976562, -0.01010751724243164, -0.009753227233886719, -0.009398937225341797, -0.009044647216796875, -0.008690357208251953, -0.008336067199707031, -0.00798177719116211, -0.0076274871826171875, -0.007273197174072266, -0.006918907165527344, -0.006564617156982422, -0.0062103271484375, -0.005856037139892578, -0.005501747131347656, -0.005147457122802734, -0.0047931671142578125, -0.004438877105712891, -0.004084587097167969, -0.003730297088623047, -0.003376007080078125, -0.003021717071533203, -0.0026674270629882812, -0.0023131370544433594, -0.0019588470458984375, -0.0016045570373535156, -0.0012502670288085938, -0.0008959770202636719, -0.00054168701171875, -0.00018739700317382812, 0.00016689300537109375, 0.0005211830139160156, 0.0008754730224609375, 0.0012297630310058594, 0.0015840530395507812, 0.0019383430480957031, 0.002292633056640625, 0.002646923065185547, 0.0030012130737304688, 0.0033555030822753906, 0.0037097930908203125, 0.004064083099365234, 0.004418373107910156, 0.004772663116455078, 0.005126953125, 0.005481243133544922, 0.005835533142089844, 0.006189823150634766, 0.0065441131591796875, 0.006898403167724609, 0.007252693176269531, 0.007606983184814453, 0.007961273193359375, 0.008315563201904297, 0.008669853210449219, 0.00902414321899414, 0.009378433227539062, 0.009732723236083984, 0.010087013244628906, 0.010441303253173828, 0.01079559326171875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 11.0, 23.0, 18.0, 22.0, 62.0, 68.0, 98.0, 152.0, 229.0, 354.0, 567.0, 796.0, 1237.0, 2030.0, 3418.0, 6244.0, 11914.0, 25520.0, 67533.0, 457847.0, 357987.0, 62333.0, 24090.0, 11239.0, 5845.0, 3335.0, 2010.0, 1248.0, 795.0, 517.0, 325.0, 215.0, 142.0, 112.0, 52.0, 56.0, 33.0, 15.0, 27.0, 7.0, 7.0, 6.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.0013170242309570312, -0.0012793540954589844, -0.0012416839599609375, -0.0012040138244628906, -0.0011663436889648438, -0.0011286735534667969, -0.00109100341796875, -0.0010533332824707031, -0.0010156631469726562, -0.0009779930114746094, -0.0009403228759765625, -0.0009026527404785156, -0.0008649826049804688, -0.0008273124694824219, -0.000789642333984375, -0.0007519721984863281, -0.0007143020629882812, -0.0006766319274902344, -0.0006389617919921875, -0.0006012916564941406, -0.0005636215209960938, -0.0005259513854980469, -0.00048828125, -0.0004506111145019531, -0.00041294097900390625, -0.0003752708435058594, -0.0003376007080078125, -0.0002999305725097656, -0.00026226043701171875, -0.00022459030151367188, -0.000186920166015625, -0.00014925003051757812, -0.00011157989501953125, -7.390975952148438e-05, -3.62396240234375e-05, 1.430511474609375e-06, 3.910064697265625e-05, 7.677078247070312e-05, 0.00011444091796875, 0.00015211105346679688, 0.00018978118896484375, 0.00022745132446289062, 0.0002651214599609375, 0.0003027915954589844, 0.00034046173095703125, 0.0003781318664550781, 0.000415802001953125, 0.0004534721374511719, 0.0004911422729492188, 0.0005288124084472656, 0.0005664825439453125, 0.0006041526794433594, 0.0006418228149414062, 0.0006794929504394531, 0.0007171630859375, 0.0007548332214355469, 0.0007925033569335938, 0.0008301734924316406, 0.0008678436279296875, 0.0009055137634277344, 0.0009431838989257812, 0.0009808540344238281, 0.001018524169921875, 0.0010561943054199219, 0.0010938644409179688]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 7.0, 0.0, 12.0, 0.0, 7.0, 0.0, 22.0, 0.0, 30.0, 0.0, 43.0, 0.0, 62.0, 0.0, 120.0, 0.0, 117.0, 0.0, 152.0, 0.0, 129.0, 0.0, 0.0, 105.0, 0.0, 81.0, 0.0, 45.0, 0.0, 28.0, 0.0, 15.0, 0.0, 18.0, 0.0, 8.0, 0.0, 7.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.055940270423889e-07, -7.767230272293091e-07, -7.478520274162292e-07, -7.189810276031494e-07, -6.901100277900696e-07, -6.612390279769897e-07, -6.323680281639099e-07, -6.034970283508301e-07, -5.746260285377502e-07, -5.457550287246704e-07, -5.168840289115906e-07, -4.880130290985107e-07, -4.591420292854309e-07, -4.302710294723511e-07, -4.0140002965927124e-07, -3.725290298461914e-07, -3.4365803003311157e-07, -3.1478703022003174e-07, -2.859160304069519e-07, -2.5704503059387207e-07, -2.2817403078079224e-07, -1.993030309677124e-07, -1.7043203115463257e-07, -1.4156103134155273e-07, -1.126900315284729e-07, -8.381903171539307e-08, -5.494803190231323e-08, -2.60770320892334e-08, 2.7939677238464355e-09, 3.166496753692627e-08, 6.05359673500061e-08, 8.940696716308594e-08, 1.1827796697616577e-07, 1.471489667892456e-07, 1.7601996660232544e-07, 2.0489096641540527e-07, 2.337619662284851e-07, 2.6263296604156494e-07, 2.915039658546448e-07, 3.203749656677246e-07, 3.4924596548080444e-07, 3.781169652938843e-07, 4.069879651069641e-07, 4.3585896492004395e-07, 4.647299647331238e-07, 4.936009645462036e-07, 5.224719643592834e-07, 5.513429641723633e-07, 5.802139639854431e-07, 6.09084963798523e-07, 6.379559636116028e-07, 6.668269634246826e-07, 6.956979632377625e-07, 7.245689630508423e-07, 7.534399628639221e-07, 7.82310962677002e-07, 8.111819624900818e-07, 8.400529623031616e-07, 8.689239621162415e-07, 8.977949619293213e-07, 9.266659617424011e-07, 9.55536961555481e-07, 9.844079613685608e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 2.0, 5.0, 13.0, 2.0, 12.0, 11.0, 23.0, 28.0, 47.0, 62.0, 72.0, 111.0, 124.0, 186.0, 226.0, 328.0, 488.0, 685.0, 963.0, 1454.0, 2136.0, 3351.0, 5121.0, 8364.0, 14186.0, 26110.0, 55265.0, 193396.0, 552752.0, 95327.0, 37960.0, 19585.0, 10839.0, 6635.0, 4178.0, 2670.0, 1736.0, 1222.0, 776.0, 528.0, 448.0, 310.0, 209.0, 164.0, 130.0, 67.0, 74.0, 47.0, 32.0, 37.0, 21.0, 11.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0009026527404785156, -0.0008737817406654358, -0.000844910740852356, -0.0008160397410392761, -0.0007871687412261963, -0.0007582977414131165, -0.0007294267416000366, -0.0007005557417869568, -0.000671684741973877, -0.0006428137421607971, -0.0006139427423477173, -0.0005850717425346375, -0.0005562007427215576, -0.0005273297429084778, -0.000498458743095398, -0.0004695877432823181, -0.0004407167434692383, -0.00041184574365615845, -0.0003829747438430786, -0.0003541037440299988, -0.00032523274421691895, -0.0002963617444038391, -0.0002674907445907593, -0.00023861974477767944, -0.0002097487449645996, -0.00018087774515151978, -0.00015200674533843994, -0.0001231357455253601, -9.426474571228027e-05, -6.539374589920044e-05, -3.6522746086120605e-05, -7.651746273040771e-06, 2.1219253540039062e-05, 5.0090253353118896e-05, 7.896125316619873e-05, 0.00010783225297927856, 0.0001367032527923584, 0.00016557425260543823, 0.00019444525241851807, 0.0002233162522315979, 0.00025218725204467773, 0.00028105825185775757, 0.0003099292516708374, 0.00033880025148391724, 0.00036767125129699707, 0.0003965422511100769, 0.00042541325092315674, 0.00045428425073623657, 0.0004831552505493164, 0.0005120262503623962, 0.0005408972501754761, 0.0005697682499885559, 0.0005986392498016357, 0.0006275102496147156, 0.0006563812494277954, 0.0006852522492408752, 0.0007141232490539551, 0.0007429942488670349, 0.0007718652486801147, 0.0008007362484931946, 0.0008296072483062744, 0.0008584782481193542, 0.0008873492479324341, 0.0009162202477455139, 0.0009450912475585938]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 8.0, 9.0, 5.0, 8.0, 9.0, 17.0, 21.0, 14.0, 24.0, 23.0, 28.0, 33.0, 82.0, 150.0, 169.0, 101.0, 79.0, 53.0, 39.0, 36.0, 16.0, 19.0, 13.0, 11.0, 6.0, 8.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00028896331787109375, -0.0002794191241264343, -0.0002698749303817749, -0.0002603307366371155, -0.00025078654289245605, -0.00024124234914779663, -0.0002316981554031372, -0.00022215396165847778, -0.00021260976791381836, -0.00020306557416915894, -0.0001935213804244995, -0.0001839771866798401, -0.00017443299293518066, -0.00016488879919052124, -0.00015534460544586182, -0.0001458004117012024, -0.00013625621795654297, -0.00012671202421188354, -0.00011716783046722412, -0.0001076236367225647, -9.807944297790527e-05, -8.853524923324585e-05, -7.899105548858643e-05, -6.9446861743927e-05, -5.990266799926758e-05, -5.0358474254608154e-05, -4.081428050994873e-05, -3.127008676528931e-05, -2.1725893020629883e-05, -1.2181699275970459e-05, -2.637505531311035e-06, 6.906688213348389e-06, 1.6450881958007812e-05, 2.5995075702667236e-05, 3.553926944732666e-05, 4.5083463191986084e-05, 5.462765693664551e-05, 6.417185068130493e-05, 7.371604442596436e-05, 8.326023817062378e-05, 9.28044319152832e-05, 0.00010234862565994263, 0.00011189281940460205, 0.00012143701314926147, 0.0001309812068939209, 0.00014052540063858032, 0.00015006959438323975, 0.00015961378812789917, 0.0001691579818725586, 0.00017870217561721802, 0.00018824636936187744, 0.00019779056310653687, 0.0002073347568511963, 0.0002168789505958557, 0.00022642314434051514, 0.00023596733808517456, 0.000245511531829834, 0.0002550557255744934, 0.00026459991931915283, 0.00027414411306381226, 0.0002836883068084717, 0.0002932325005531311, 0.00030277669429779053, 0.00031232088804244995, 0.0003218650817871094]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 12.0, 11.0, 8.0, 18.0, 31.0, 36.0, 71.0, 95.0, 118.0, 151.0, 114.0, 95.0, 62.0, 46.0, 24.0, 30.0, 19.0, 18.0, 8.0, 8.0, 2.0, 5.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03794517740607262, -0.03670559823513031, -0.0354660227894783, -0.034226443618535995, -0.03298686444759369, -0.03174728527665138, -0.030507707968354225, -0.029268130660057068, -0.02802855148911476, -0.026788972318172455, -0.025549395009875298, -0.02430981770157814, -0.023070238530635834, -0.021830659359693527, -0.02059108205139637, -0.019351504743099213, -0.018111925572156906, -0.0168723464012146, -0.015632769092917442, -0.01439319085329771, -0.013153612613677979, -0.011914034374058247, -0.010674456134438515, -0.009434877894818783, -0.008195299655199051, -0.006955721415579319, -0.005716143175959587, -0.004476564936339855, -0.0032369866967201233, -0.0019974084571003914, -0.0007578302174806595, 0.0004817480221390724, 0.0017213225364685059, 0.0029609007760882378, 0.00420047901570797, 0.005440057255327702, 0.0066796354949474335, 0.007919213734567165, 0.009158791974186897, 0.01039837021380663, 0.011637948453426361, 0.012877526693046093, 0.014117104932665825, 0.015356683172285557, 0.01659626141190529, 0.017835840582847595, 0.019075417891144753, 0.02031499519944191, 0.021554574370384216, 0.022794153541326523, 0.02403373084962368, 0.025273308157920837, 0.026512887328863144, 0.02775246649980545, 0.028992043808102608, 0.030231621116399765, 0.03147120028734207, 0.03271077945828438, 0.033950358629226685, 0.03518993407487869, 0.036429513245821, 0.037669092416763306, 0.038908667862415314, 0.04014824703335762, 0.04138782620429993]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 8.0, 13.0, 10.0, 14.0, 17.0, 23.0, 24.0, 18.0, 32.0, 25.0, 32.0, 27.0, 27.0, 38.0, 31.0, 42.0, 34.0, 42.0, 45.0, 34.0, 36.0, 32.0, 34.0, 39.0, 34.0, 31.0, 30.0, 24.0, 24.0, 21.0, 24.0, 20.0, 18.0, 15.0, 11.0, 12.0, 12.0, 4.0, 9.0, 8.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.018594810739159584, -0.01800922304391861, -0.017423633486032486, -0.01683804579079151, -0.016252458095550537, -0.015666870400309563, -0.015081281773746014, -0.014495693147182465, -0.01391010545194149, -0.013324517756700516, -0.012738929130136967, -0.012153340503573418, -0.011567752808332443, -0.010982165113091469, -0.01039657648652792, -0.00981098785996437, -0.009225400164723396, -0.008639812469482422, -0.008054223842918873, -0.007468635682016611, -0.006883047521114349, -0.006297459360212088, -0.005711871199309826, -0.005126283038407564, -0.004540694877505302, -0.003955106716603041, -0.003369518555700779, -0.0027839303947985172, -0.0021983422338962555, -0.0016127540729939938, -0.001027165912091732, -0.0004415777511894703, 0.00014401227235794067, 0.0007296004332602024, 0.0013151885941624641, 0.0019007767550647259, 0.0024863649159669876, 0.0030719530768692493, 0.003657541237771511, 0.004243129398673773, 0.0048287175595760345, 0.005414305720478296, 0.005999893881380558, 0.00658548204228282, 0.0071710702031850815, 0.007756658364087343, 0.008342246524989605, 0.008927835151553154, 0.009513422846794128, 0.010099010542035103, 0.010684599168598652, 0.011270187795162201, 0.011855775490403175, 0.01244136318564415, 0.013026951812207699, 0.013612540438771248, 0.014198128134012222, 0.014783715829253197, 0.015369304455816746, 0.015954893082380295, 0.01654048077762127, 0.017126068472862244, 0.017711658030748367, 0.018297245725989342, 0.018882833421230316]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 17.0, 12.0, 25.0, 34.0, 46.0, 67.0, 85.0, 121.0, 179.0, 310.0, 395.0, 621.0, 869.0, 1260.0, 1704.0, 2360.0, 3314.0, 4980.0, 7549.0, 11395.0, 17980.0, 29159.0, 48758.0, 85889.0, 163507.0, 419721.0, 1502218.0, 1218689.0, 329957.0, 142034.0, 76461.0, 44688.0, 27271.0, 17426.0, 11352.0, 7621.0, 5034.0, 3531.0, 2358.0, 1617.0, 1179.0, 788.0, 514.0, 398.0, 253.0, 180.0, 132.0, 79.0, 49.0, 52.0, 25.0, 9.0, 3.0, 4.0, 5.0, 0.0, 3.0], "bins": [-0.0269622802734375, -0.02616715431213379, -0.025372028350830078, -0.024576902389526367, -0.023781776428222656, -0.022986650466918945, -0.022191524505615234, -0.021396398544311523, -0.020601272583007812, -0.0198061466217041, -0.01901102066040039, -0.01821589469909668, -0.01742076873779297, -0.016625642776489258, -0.015830516815185547, -0.015035390853881836, -0.014240264892578125, -0.013445138931274414, -0.012650012969970703, -0.011854887008666992, -0.011059761047363281, -0.01026463508605957, -0.00946950912475586, -0.008674383163452148, -0.007879257202148438, -0.0070841312408447266, -0.006289005279541016, -0.005493879318237305, -0.004698753356933594, -0.003903627395629883, -0.003108501434326172, -0.002313375473022461, -0.00151824951171875, -0.0007231235504150391, 7.200241088867188e-05, 0.0008671283721923828, 0.0016622543334960938, 0.0024573802947998047, 0.0032525062561035156, 0.0040476322174072266, 0.0048427581787109375, 0.0056378841400146484, 0.006433010101318359, 0.00722813606262207, 0.008023262023925781, 0.008818387985229492, 0.009613513946533203, 0.010408639907836914, 0.011203765869140625, 0.011998891830444336, 0.012794017791748047, 0.013589143753051758, 0.014384269714355469, 0.01517939567565918, 0.01597452163696289, 0.0167696475982666, 0.017564773559570312, 0.018359899520874023, 0.019155025482177734, 0.019950151443481445, 0.020745277404785156, 0.021540403366088867, 0.022335529327392578, 0.02313065528869629, 0.02392578125]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 6.0, 9.0, 7.0, 12.0, 11.0, 17.0, 20.0, 18.0, 20.0, 34.0, 20.0, 30.0, 33.0, 33.0, 41.0, 31.0, 34.0, 36.0, 44.0, 48.0, 47.0, 43.0, 34.0, 46.0, 41.0, 32.0, 35.0, 29.0, 20.0, 21.0, 20.0, 20.0, 17.0, 17.0, 15.0, 14.0, 10.0, 5.0, 5.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01141357421875, -0.011054158210754395, -0.010694742202758789, -0.010335326194763184, -0.009975910186767578, -0.009616494178771973, -0.009257078170776367, -0.008897662162780762, -0.008538246154785156, -0.00817883014678955, -0.007819414138793945, -0.00745999813079834, -0.007100582122802734, -0.006741166114807129, -0.0063817501068115234, -0.006022334098815918, -0.0056629180908203125, -0.005303502082824707, -0.0049440860748291016, -0.004584670066833496, -0.004225254058837891, -0.003865838050842285, -0.0035064220428466797, -0.0031470060348510742, -0.0027875900268554688, -0.0024281740188598633, -0.002068758010864258, -0.0017093420028686523, -0.0013499259948730469, -0.0009905099868774414, -0.0006310939788818359, -0.00027167797088623047, 8.7738037109375e-05, 0.00044715404510498047, 0.0008065700531005859, 0.0011659860610961914, 0.0015254020690917969, 0.0018848180770874023, 0.002244234085083008, 0.0026036500930786133, 0.0029630661010742188, 0.0033224821090698242, 0.0036818981170654297, 0.004041314125061035, 0.004400730133056641, 0.004760146141052246, 0.0051195621490478516, 0.005478978157043457, 0.0058383941650390625, 0.006197810173034668, 0.0065572261810302734, 0.006916642189025879, 0.007276058197021484, 0.00763547420501709, 0.007994890213012695, 0.0083543062210083, 0.008713722229003906, 0.009073138236999512, 0.009432554244995117, 0.009791970252990723, 0.010151386260986328, 0.010510802268981934, 0.010870218276977539, 0.011229634284973145, 0.01158905029296875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 11.0, 7.0, 16.0, 16.0, 35.0, 38.0, 57.0, 79.0, 132.0, 165.0, 253.0, 318.0, 551.0, 769.0, 1078.0, 1820.0, 2649.0, 4220.0, 6904.0, 11074.0, 19029.0, 33117.0, 60068.0, 115076.0, 240747.0, 569518.0, 1614542.0, 856783.0, 326659.0, 150917.0, 76663.0, 41447.0, 23318.0, 13472.0, 8258.0, 5113.0, 3174.0, 2053.0, 1317.0, 852.0, 610.0, 399.0, 277.0, 219.0, 146.0, 105.0, 76.0, 46.0, 28.0, 25.0, 16.0, 11.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0211029052734375, -0.020415306091308594, -0.019727706909179688, -0.01904010772705078, -0.018352508544921875, -0.01766490936279297, -0.016977310180664062, -0.016289710998535156, -0.01560211181640625, -0.014914512634277344, -0.014226913452148438, -0.013539314270019531, -0.012851715087890625, -0.012164115905761719, -0.011476516723632812, -0.010788917541503906, -0.010101318359375, -0.009413719177246094, -0.008726119995117188, -0.008038520812988281, -0.007350921630859375, -0.006663322448730469, -0.0059757232666015625, -0.005288124084472656, -0.00460052490234375, -0.003912925720214844, -0.0032253265380859375, -0.0025377273559570312, -0.001850128173828125, -0.0011625289916992188, -0.0004749298095703125, 0.00021266937255859375, 0.0009002685546875, 0.0015878677368164062, 0.0022754669189453125, 0.0029630661010742188, 0.003650665283203125, 0.004338264465332031, 0.0050258636474609375, 0.005713462829589844, 0.00640106201171875, 0.007088661193847656, 0.0077762603759765625, 0.008463859558105469, 0.009151458740234375, 0.009839057922363281, 0.010526657104492188, 0.011214256286621094, 0.01190185546875, 0.012589454650878906, 0.013277053833007812, 0.013964653015136719, 0.014652252197265625, 0.015339851379394531, 0.016027450561523438, 0.016715049743652344, 0.01740264892578125, 0.018090248107910156, 0.018777847290039062, 0.01946544647216797, 0.020153045654296875, 0.02084064483642578, 0.021528244018554688, 0.022215843200683594, 0.0229034423828125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 5.0, 3.0, 10.0, 8.0, 8.0, 9.0, 17.0, 20.0, 23.0, 24.0, 26.0, 51.0, 56.0, 58.0, 73.0, 73.0, 124.0, 134.0, 148.0, 195.0, 209.0, 257.0, 261.0, 318.0, 304.0, 258.0, 239.0, 190.0, 169.0, 144.0, 132.0, 107.0, 85.0, 54.0, 68.0, 30.0, 39.0, 35.0, 16.0, 27.0, 12.0, 10.0, 4.0, 7.0, 12.0, 3.0, 5.0, 2.0, 3.0, 1.0, 5.0], "bins": [-0.007114410400390625, -0.00691986083984375, -0.006725311279296875, -0.00653076171875, -0.006336212158203125, -0.00614166259765625, -0.005947113037109375, -0.0057525634765625, -0.005558013916015625, -0.00536346435546875, -0.005168914794921875, -0.004974365234375, -0.004779815673828125, -0.00458526611328125, -0.004390716552734375, -0.0041961669921875, -0.004001617431640625, -0.00380706787109375, -0.003612518310546875, -0.00341796875, -0.003223419189453125, -0.00302886962890625, -0.002834320068359375, -0.0026397705078125, -0.002445220947265625, -0.00225067138671875, -0.002056121826171875, -0.001861572265625, -0.001667022705078125, -0.00147247314453125, -0.001277923583984375, -0.0010833740234375, -0.000888824462890625, -0.00069427490234375, -0.000499725341796875, -0.00030517578125, -0.000110626220703125, 8.392333984375e-05, 0.000278472900390625, 0.0004730224609375, 0.000667572021484375, 0.00086212158203125, 0.001056671142578125, 0.001251220703125, 0.001445770263671875, 0.00164031982421875, 0.001834869384765625, 0.0020294189453125, 0.002223968505859375, 0.00241851806640625, 0.002613067626953125, 0.0028076171875, 0.003002166748046875, 0.00319671630859375, 0.003391265869140625, 0.0035858154296875, 0.003780364990234375, 0.00397491455078125, 0.004169464111328125, 0.004364013671875, 0.004558563232421875, 0.00475311279296875, 0.004947662353515625, 0.0051422119140625, 0.005336761474609375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 11.0, 14.0, 18.0, 29.0, 31.0, 60.0, 62.0, 108.0, 138.0, 137.0, 114.0, 82.0, 45.0, 40.0, 27.0, 22.0, 11.0, 9.0, 13.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028018012642860413, -0.027194973081350327, -0.02637193538248539, -0.025548895820975304, -0.024725858122110367, -0.02390281856060028, -0.023079778999090195, -0.02225673943758011, -0.021433701738715172, -0.020610662177205086, -0.01978762447834015, -0.018964584916830063, -0.018141545355319977, -0.01731850765645504, -0.016495468094944954, -0.015672430396080017, -0.014849390834569931, -0.01402635220438242, -0.013203313574194908, -0.012380274012684822, -0.01155723538249731, -0.0107341967523098, -0.009911157190799713, -0.009088118560612202, -0.00826507993042469, -0.007442041300237179, -0.00661900220438838, -0.005795963108539581, -0.00497292447835207, -0.004149885848164558, -0.0033268467523157597, -0.002503807656466961, -0.0016807708889245987, -0.0008577320259064436, -3.46931628882885e-05, 0.0007883457001298666, 0.0016113845631480217, 0.002434423193335533, 0.003257462289184332, 0.004080501385033131, 0.004903540015220642, 0.0057265786454081535, 0.006549617741256952, 0.007372656837105751, 0.008195695467293262, 0.009018734097480774, 0.00984177365899086, 0.010664812289178371, 0.011487850919365883, 0.012310889549553394, 0.013133928179740906, 0.013956967741250992, 0.014780006371438503, 0.015603045001626015, 0.0164260845631361, 0.017249122262001038, 0.018072161823511124, 0.01889520138502121, 0.019718239083886147, 0.020541278645396233, 0.02136431634426117, 0.022187355905771255, 0.02301039546728134, 0.023833435028791428, 0.024656472727656364]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 7.0, 11.0, 24.0, 24.0, 21.0, 23.0, 32.0, 35.0, 30.0, 46.0, 32.0, 35.0, 33.0, 41.0, 35.0, 39.0, 38.0, 36.0, 45.0, 42.0, 45.0, 32.0, 32.0, 31.0, 25.0, 28.0, 16.0, 15.0, 19.0, 19.0, 14.0, 14.0, 7.0, 16.0, 8.0, 5.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011003697291016579, -0.010626931674778461, -0.010250166989862919, -0.009873401373624802, -0.009496635757386684, -0.009119870141148567, -0.008743105456233025, -0.008366339839994907, -0.00798957422375679, -0.00761280907317996, -0.007236043456941843, -0.006859278306365013, -0.006482512690126896, -0.006105747539550066, -0.005728982388973236, -0.005352216772735119, -0.004975452087819576, -0.004598686937242746, -0.004221921321004629, -0.0038451561704277992, -0.0034683907870203257, -0.003091625403612852, -0.002714860253036022, -0.0023380948696285486, -0.001961329486221075, -0.0015845641028136015, -0.0012077988358214498, -0.000831033568829298, -0.00045426818542182446, -7.750280201435089e-05, 0.000299262348562479, 0.0006760277319699526, 0.0010527921840548515, 0.001429557567462325, 0.0018063228344544768, 0.0021830881014466286, 0.002559853484854102, 0.0029366188682615757, 0.0033133840188384056, 0.003690149402245879, 0.004066914785653353, 0.004443679936230183, 0.0048204455524683, 0.00519721070304513, 0.00557397585362196, 0.005950741469860077, 0.006327506620436907, 0.006704271771013737, 0.007081037387251854, 0.007457802537828684, 0.007834567688405514, 0.008211333304643631, 0.008588098920881748, 0.008964864537119865, 0.009341629222035408, 0.009718394838273525, 0.010095160454511642, 0.01047192607074976, 0.010848690755665302, 0.01122545637190342, 0.011602221988141537, 0.011978987604379654, 0.012355752289295197, 0.012732517905533314, 0.013109282590448856]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 13.0, 17.0, 29.0, 42.0, 60.0, 97.0, 124.0, 178.0, 316.0, 434.0, 699.0, 1075.0, 1654.0, 2551.0, 4016.0, 6285.0, 10016.0, 16776.0, 28823.0, 51365.0, 97895.0, 218844.0, 312514.0, 134960.0, 67469.0, 36732.0, 21142.0, 12776.0, 7698.0, 4878.0, 3146.0, 2036.0, 1271.0, 890.0, 590.0, 363.0, 224.0, 186.0, 113.0, 89.0, 41.0, 38.0, 31.0, 20.0, 11.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.00466156005859375, -0.0045122504234313965, -0.004362940788269043, -0.0042136311531066895, -0.004064321517944336, -0.003915011882781982, -0.003765702247619629, -0.0036163926124572754, -0.003467082977294922, -0.0033177733421325684, -0.003168463706970215, -0.0030191540718078613, -0.002869844436645508, -0.0027205348014831543, -0.0025712251663208008, -0.0024219155311584473, -0.0022726058959960938, -0.0021232962608337402, -0.0019739866256713867, -0.0018246769905090332, -0.0016753673553466797, -0.0015260577201843262, -0.0013767480850219727, -0.0012274384498596191, -0.0010781288146972656, -0.0009288191795349121, -0.0007795095443725586, -0.0006301999092102051, -0.00048089027404785156, -0.00033158063888549805, -0.00018227100372314453, -3.2961368560791016e-05, 0.0001163482666015625, 0.000265657901763916, 0.00041496753692626953, 0.000564277172088623, 0.0007135868072509766, 0.0008628964424133301, 0.0010122060775756836, 0.0011615157127380371, 0.0013108253479003906, 0.0014601349830627441, 0.0016094446182250977, 0.0017587542533874512, 0.0019080638885498047, 0.002057373523712158, 0.0022066831588745117, 0.0023559927940368652, 0.0025053024291992188, 0.0026546120643615723, 0.0028039216995239258, 0.0029532313346862793, 0.003102540969848633, 0.0032518506050109863, 0.00340116024017334, 0.0035504698753356934, 0.003699779510498047, 0.0038490891456604004, 0.003998398780822754, 0.004147708415985107, 0.004297018051147461, 0.0044463276863098145, 0.004595637321472168, 0.0047449469566345215, 0.004894256591796875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 5.0, 8.0, 11.0, 20.0, 26.0, 15.0, 21.0, 33.0, 41.0, 32.0, 33.0, 37.0, 38.0, 53.0, 42.0, 45.0, 36.0, 40.0, 39.0, 38.0, 44.0, 38.0, 39.0, 33.0, 26.0, 32.0, 24.0, 22.0, 21.0, 15.0, 13.0, 12.0, 10.0, 15.0, 10.0, 8.0, 2.0, 2.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0119476318359375, -0.011534452438354492, -0.011121273040771484, -0.010708093643188477, -0.010294914245605469, -0.009881734848022461, -0.009468555450439453, -0.009055376052856445, -0.008642196655273438, -0.00822901725769043, -0.007815837860107422, -0.007402658462524414, -0.006989479064941406, -0.0065762996673583984, -0.006163120269775391, -0.005749940872192383, -0.005336761474609375, -0.004923582077026367, -0.004510402679443359, -0.0040972232818603516, -0.0036840438842773438, -0.003270864486694336, -0.002857685089111328, -0.0024445056915283203, -0.0020313262939453125, -0.0016181468963623047, -0.0012049674987792969, -0.0007917881011962891, -0.00037860870361328125, 3.457069396972656e-05, 0.0004477500915527344, 0.0008609294891357422, 0.00127410888671875, 0.0016872882843017578, 0.0021004676818847656, 0.0025136470794677734, 0.0029268264770507812, 0.003340005874633789, 0.003753185272216797, 0.004166364669799805, 0.0045795440673828125, 0.00499272346496582, 0.005405902862548828, 0.005819082260131836, 0.006232261657714844, 0.0066454410552978516, 0.007058620452880859, 0.007471799850463867, 0.007884979248046875, 0.008298158645629883, 0.00871133804321289, 0.009124517440795898, 0.009537696838378906, 0.009950876235961914, 0.010364055633544922, 0.01077723503112793, 0.011190414428710938, 0.011603593826293945, 0.012016773223876953, 0.012429952621459961, 0.012843132019042969, 0.013256311416625977, 0.013669490814208984, 0.014082670211791992, 0.014495849609375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [5.0, 5.0, 0.0, 4.0, 9.0, 6.0, 13.0, 17.0, 15.0, 24.0, 36.0, 59.0, 70.0, 100.0, 130.0, 189.0, 289.0, 379.0, 580.0, 865.0, 1297.0, 1984.0, 3092.0, 4857.0, 7974.0, 14028.0, 26436.0, 54238.0, 140264.0, 470515.0, 183860.0, 65992.0, 30834.0, 15897.0, 9047.0, 5404.0, 3394.0, 2159.0, 1402.0, 965.0, 608.0, 460.0, 304.0, 224.0, 166.0, 94.0, 72.0, 53.0, 52.0, 35.0, 17.0, 15.0, 10.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.006839752197265625, -0.006608784198760986, -0.006377816200256348, -0.006146848201751709, -0.00591588020324707, -0.005684912204742432, -0.005453944206237793, -0.005222976207733154, -0.004992008209228516, -0.004761040210723877, -0.004530072212219238, -0.0042991042137146, -0.004068136215209961, -0.0038371682167053223, -0.0036062002182006836, -0.003375232219696045, -0.0031442642211914062, -0.0029132962226867676, -0.002682328224182129, -0.0024513602256774902, -0.0022203922271728516, -0.001989424228668213, -0.0017584562301635742, -0.0015274882316589355, -0.0012965202331542969, -0.0010655522346496582, -0.0008345842361450195, -0.0006036162376403809, -0.0003726482391357422, -0.00014168024063110352, 8.928775787353516e-05, 0.00032025575637817383, 0.0005512237548828125, 0.0007821917533874512, 0.0010131597518920898, 0.0012441277503967285, 0.0014750957489013672, 0.0017060637474060059, 0.0019370317459106445, 0.002167999744415283, 0.002398967742919922, 0.0026299357414245605, 0.0028609037399291992, 0.003091871738433838, 0.0033228397369384766, 0.0035538077354431152, 0.003784775733947754, 0.004015743732452393, 0.004246711730957031, 0.00447767972946167, 0.004708647727966309, 0.004939615726470947, 0.005170583724975586, 0.005401551723480225, 0.005632519721984863, 0.005863487720489502, 0.006094455718994141, 0.006325423717498779, 0.006556391716003418, 0.006787359714508057, 0.007018327713012695, 0.007249295711517334, 0.007480263710021973, 0.007711231708526611, 0.00794219970703125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 10.0, 7.0, 11.0, 5.0, 12.0, 15.0, 16.0, 18.0, 17.0, 25.0, 26.0, 21.0, 24.0, 37.0, 28.0, 36.0, 40.0, 30.0, 46.0, 42.0, 41.0, 44.0, 49.0, 42.0, 42.0, 37.0, 20.0, 31.0, 25.0, 27.0, 22.0, 21.0, 27.0, 8.0, 19.0, 18.0, 14.0, 9.0, 10.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007404327392578125, -0.007162988185882568, -0.006921648979187012, -0.006680309772491455, -0.0064389705657958984, -0.006197631359100342, -0.005956292152404785, -0.0057149529457092285, -0.005473613739013672, -0.005232274532318115, -0.004990935325622559, -0.004749596118927002, -0.004508256912231445, -0.004266917705535889, -0.004025578498840332, -0.0037842392921447754, -0.0035429000854492188, -0.003301560878753662, -0.0030602216720581055, -0.002818882465362549, -0.002577543258666992, -0.0023362040519714355, -0.002094864845275879, -0.0018535256385803223, -0.0016121864318847656, -0.001370847225189209, -0.0011295080184936523, -0.0008881688117980957, -0.0006468296051025391, -0.0004054903984069824, -0.00016415119171142578, 7.718801498413086e-05, 0.0003185272216796875, 0.0005598664283752441, 0.0008012056350708008, 0.0010425448417663574, 0.001283884048461914, 0.0015252232551574707, 0.0017665624618530273, 0.002007901668548584, 0.0022492408752441406, 0.0024905800819396973, 0.002731919288635254, 0.0029732584953308105, 0.003214597702026367, 0.003455936908721924, 0.0036972761154174805, 0.003938615322113037, 0.004179954528808594, 0.00442129373550415, 0.004662632942199707, 0.004903972148895264, 0.00514531135559082, 0.005386650562286377, 0.005627989768981934, 0.00586932897567749, 0.006110668182373047, 0.0063520073890686035, 0.00659334659576416, 0.006834685802459717, 0.0070760250091552734, 0.00731736421585083, 0.007558703422546387, 0.007800042629241943, 0.0080413818359375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 5.0, 12.0, 10.0, 22.0, 27.0, 42.0, 44.0, 69.0, 97.0, 135.0, 213.0, 312.0, 494.0, 731.0, 1145.0, 1785.0, 3003.0, 5138.0, 9820.0, 19640.0, 45721.0, 145461.0, 599780.0, 131592.0, 42578.0, 18514.0, 9123.0, 5096.0, 2877.0, 1725.0, 1119.0, 736.0, 448.0, 312.0, 215.0, 146.0, 121.0, 77.0, 44.0, 30.0, 28.0, 22.0, 11.0, 11.0, 9.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004878044128417969, -0.00047179311513900757, -0.00045578181743621826, -0.00043977051973342896, -0.00042375922203063965, -0.00040774792432785034, -0.00039173662662506104, -0.00037572532892227173, -0.0003597140312194824, -0.0003437027335166931, -0.0003276914358139038, -0.0003116801381111145, -0.0002956688404083252, -0.0002796575427055359, -0.0002636462450027466, -0.0002476349472999573, -0.00023162364959716797, -0.00021561235189437866, -0.00019960105419158936, -0.00018358975648880005, -0.00016757845878601074, -0.00015156716108322144, -0.00013555586338043213, -0.00011954456567764282, -0.00010353326797485352, -8.752197027206421e-05, -7.15106725692749e-05, -5.5499374866485596e-05, -3.948807716369629e-05, -2.3476779460906982e-05, -7.465481758117676e-06, 8.545815944671631e-06, 2.4557113647460938e-05, 4.0568411350250244e-05, 5.657970905303955e-05, 7.259100675582886e-05, 8.860230445861816e-05, 0.00010461360216140747, 0.00012062489986419678, 0.00013663619756698608, 0.0001526474952697754, 0.0001686587929725647, 0.000184670090675354, 0.0002006813883781433, 0.00021669268608093262, 0.00023270398378372192, 0.00024871528148651123, 0.00026472657918930054, 0.00028073787689208984, 0.00029674917459487915, 0.00031276047229766846, 0.00032877177000045776, 0.00034478306770324707, 0.0003607943654060364, 0.0003768056631088257, 0.000392816960811615, 0.0004088282585144043, 0.0004248395562171936, 0.0004408508539199829, 0.0004568621516227722, 0.0004728734493255615, 0.0004888847470283508, 0.0005048960447311401, 0.0005209073424339294, 0.0005369186401367188]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 5.0, 2.0, 9.0, 1.0, 10.0, 10.0, 0.0, 12.0, 10.0, 22.0, 15.0, 25.0, 38.0, 0.0, 42.0, 52.0, 45.0, 65.0, 89.0, 64.0, 0.0, 73.0, 77.0, 55.0, 78.0, 47.0, 39.0, 0.0, 24.0, 20.0, 18.0, 12.0, 13.0, 6.0, 0.0, 5.0, 4.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-06, -1.7369166016578674e-06, -1.6856938600540161e-06, -1.6344711184501648e-06, -1.5832483768463135e-06, -1.5320256352424622e-06, -1.4808028936386108e-06, -1.4295801520347595e-06, -1.3783574104309082e-06, -1.3271346688270569e-06, -1.2759119272232056e-06, -1.2246891856193542e-06, -1.173466444015503e-06, -1.1222437024116516e-06, -1.0710209608078003e-06, -1.019798219203949e-06, -9.685754776000977e-07, -9.173527359962463e-07, -8.66129994392395e-07, -8.149072527885437e-07, -7.636845111846924e-07, -7.124617695808411e-07, -6.612390279769897e-07, -6.100162863731384e-07, -5.587935447692871e-07, -5.075708031654358e-07, -4.5634806156158447e-07, -4.0512531995773315e-07, -3.5390257835388184e-07, -3.026798367500305e-07, -2.514570951461792e-07, -2.0023435354232788e-07, -1.4901161193847656e-07, -9.778887033462524e-08, -4.6566128730773926e-08, 4.6566128730773926e-09, 5.587935447692871e-08, 1.0710209608078003e-07, 1.5832483768463135e-07, 2.0954757928848267e-07, 2.60770320892334e-07, 3.119930624961853e-07, 3.632158041000366e-07, 4.1443854570388794e-07, 4.6566128730773926e-07, 5.168840289115906e-07, 5.681067705154419e-07, 6.193295121192932e-07, 6.705522537231445e-07, 7.217749953269958e-07, 7.729977369308472e-07, 8.242204785346985e-07, 8.754432201385498e-07, 9.266659617424011e-07, 9.778887033462524e-07, 1.0291114449501038e-06, 1.080334186553955e-06, 1.1315569281578064e-06, 1.1827796697616577e-06, 1.234002411365509e-06, 1.2852251529693604e-06, 1.3364478945732117e-06, 1.387670636177063e-06, 1.4388933777809143e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 6.0, 9.0, 25.0, 26.0, 33.0, 63.0, 99.0, 141.0, 171.0, 304.0, 472.0, 851.0, 1385.0, 2594.0, 4962.0, 10090.0, 22689.0, 57980.0, 195414.0, 560028.0, 117591.0, 40347.0, 16405.0, 7801.0, 3920.0, 2130.0, 1184.0, 687.0, 414.0, 231.0, 159.0, 112.0, 56.0, 58.0, 32.0, 25.0, 14.0, 7.0, 15.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008749961853027344, -0.0008487328886985779, -0.0008224695920944214, -0.0007962062954902649, -0.0007699429988861084, -0.0007436797022819519, -0.0007174164056777954, -0.0006911531090736389, -0.0006648898124694824, -0.0006386265158653259, -0.0006123632192611694, -0.0005860999226570129, -0.0005598366260528564, -0.0005335733294487, -0.0005073100328445435, -0.00048104673624038696, -0.00045478343963623047, -0.000428520143032074, -0.0004022568464279175, -0.000375993549823761, -0.0003497302532196045, -0.000323466956615448, -0.0002972036600112915, -0.000270940363407135, -0.0002446770668029785, -0.00021841377019882202, -0.00019215047359466553, -0.00016588717699050903, -0.00013962388038635254, -0.00011336058378219604, -8.709728717803955e-05, -6.083399057388306e-05, -3.457069396972656e-05, -8.307397365570068e-06, 1.7955899238586426e-05, 4.421919584274292e-05, 7.048249244689941e-05, 9.674578905105591e-05, 0.0001230090856552124, 0.0001492723822593689, 0.0001755356788635254, 0.00020179897546768188, 0.00022806227207183838, 0.0002543255686759949, 0.00028058886528015137, 0.00030685216188430786, 0.00033311545848846436, 0.00035937875509262085, 0.00038564205169677734, 0.00041190534830093384, 0.00043816864490509033, 0.0004644319415092468, 0.0004906952381134033, 0.0005169585347175598, 0.0005432218313217163, 0.0005694851279258728, 0.0005957484245300293, 0.0006220117211341858, 0.0006482750177383423, 0.0006745383143424988, 0.0007008016109466553, 0.0007270649075508118, 0.0007533282041549683, 0.0007795915007591248, 0.0008058547973632812]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 1.0, 5.0, 6.0, 2.0, 8.0, 13.0, 16.0, 15.0, 16.0, 33.0, 20.0, 45.0, 46.0, 45.0, 65.0, 71.0, 122.0, 101.0, 88.0, 40.0, 45.0, 48.0, 32.0, 21.0, 22.0, 16.0, 7.0, 6.0, 9.0, 6.0, 4.0, 2.0, 4.0, 5.0, 6.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019288063049316406, -0.00018685683608055115, -0.00018083304166793823, -0.00017480924725532532, -0.0001687854528427124, -0.0001627616584300995, -0.00015673786401748657, -0.00015071406960487366, -0.00014469027519226074, -0.00013866648077964783, -0.0001326426863670349, -0.000126618891954422, -0.00012059509754180908, -0.00011457130312919617, -0.00010854750871658325, -0.00010252371430397034, -9.649991989135742e-05, -9.047612547874451e-05, -8.445233106613159e-05, -7.842853665351868e-05, -7.240474224090576e-05, -6.638094782829285e-05, -6.035715341567993e-05, -5.4333359003067017e-05, -4.83095645904541e-05, -4.2285770177841187e-05, -3.626197576522827e-05, -3.0238181352615356e-05, -2.421438694000244e-05, -1.8190592527389526e-05, -1.2166798114776611e-05, -6.143003702163696e-06, -1.1920928955078125e-07, 5.904585123062134e-06, 1.1928379535675049e-05, 1.7952173948287964e-05, 2.397596836090088e-05, 2.9999762773513794e-05, 3.602355718612671e-05, 4.2047351598739624e-05, 4.807114601135254e-05, 5.4094940423965454e-05, 6.011873483657837e-05, 6.614252924919128e-05, 7.21663236618042e-05, 7.819011807441711e-05, 8.421391248703003e-05, 9.023770689964294e-05, 9.626150131225586e-05, 0.00010228529572486877, 0.00010830909013748169, 0.0001143328845500946, 0.00012035667896270752, 0.00012638047337532043, 0.00013240426778793335, 0.00013842806220054626, 0.00014445185661315918, 0.0001504756510257721, 0.000156499445438385, 0.00016252323985099792, 0.00016854703426361084, 0.00017457082867622375, 0.00018059462308883667, 0.00018661841750144958, 0.0001926422119140625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 11.0, 10.0, 16.0, 24.0, 31.0, 34.0, 50.0, 71.0, 105.0, 143.0, 132.0, 109.0, 79.0, 46.0, 31.0, 32.0, 17.0, 14.0, 7.0, 15.0, 9.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027803147211670876, -0.027006762102246284, -0.026210378855466843, -0.02541399374604225, -0.02461760863661766, -0.02382122352719307, -0.02302483841776848, -0.022228455170989037, -0.021432070061564445, -0.020635684952139854, -0.019839301705360413, -0.01904291659593582, -0.01824653148651123, -0.01745014637708664, -0.01665376126766205, -0.015857378020882607, -0.015060992911458015, -0.014264607802033424, -0.013468223623931408, -0.012671839445829391, -0.0118754543364048, -0.01107906922698021, -0.010282685048878193, -0.009486300870776176, -0.008689915761351585, -0.007893530651926994, -0.007097146473824978, -0.006300761830061674, -0.00550437718629837, -0.004707992542535067, -0.003911607898771763, -0.003115223255008459, -0.002318836748600006, -0.0015224521048367023, -0.0007260674610733986, 7.031718268990517e-05, 0.0008667018264532089, 0.0016630864702165127, 0.0024594711139798164, 0.00325585575774312, 0.004052240401506424, 0.004848625045269728, 0.0056450096890330315, 0.006441394332796335, 0.007237778976559639, 0.00803416408598423, 0.008830548264086246, 0.009626932442188263, 0.010423317551612854, 0.011219702661037445, 0.012016086839139462, 0.012812471017241478, 0.013608856126666069, 0.01440524123609066, 0.015201625414192677, 0.015998009592294693, 0.016794394701719284, 0.017590779811143875, 0.018387164920568466, 0.019183548167347908, 0.0199799332767725, 0.02077631838619709, 0.021572701632976532, 0.022369086742401123, 0.023165471851825714]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 7.0, 5.0, 11.0, 8.0, 11.0, 24.0, 25.0, 21.0, 25.0, 30.0, 36.0, 29.0, 41.0, 37.0, 34.0, 33.0, 39.0, 37.0, 38.0, 39.0, 36.0, 45.0, 42.0, 44.0, 32.0, 32.0, 32.0, 26.0, 26.0, 16.0, 16.0, 20.0, 18.0, 15.0, 12.0, 9.0, 14.0, 9.0, 5.0, 4.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010847250930964947, -0.010474572889506817, -0.010101893916726112, -0.009729215875267982, -0.009356537833809853, -0.008983859792351723, -0.008611180819571018, -0.008238502778112888, -0.007865823805332184, -0.007493145298212767, -0.007120467256754637, -0.00674778874963522, -0.00637511070817709, -0.0060024322010576725, -0.005629753693938255, -0.005257075652480125, -0.0048843976110219955, -0.004511719103902578, -0.0041390410624444485, -0.0037663625553250313, -0.0033936842810362577, -0.003021006006747484, -0.002648327499628067, -0.0022756492253392935, -0.00190297095105052, -0.0015302926767617464, -0.001157614286057651, -0.0007849358953535557, -0.00041225762106478214, -3.9579346776008606e-05, 0.0003330991603434086, 0.0007057774346321821, 0.001078454777598381, 0.0014511330518871546, 0.00182381144259125, 0.0021964898332953453, 0.002569168107584119, 0.0029418463818728924, 0.0033145248889923096, 0.003687203163281083, 0.004059881437569857, 0.004432559944689274, 0.004805237986147404, 0.005177916493266821, 0.005550595000386238, 0.005923273041844368, 0.006295951548963785, 0.006668630056083202, 0.007041308097541332, 0.0074139866046607494, 0.007786664646118879, 0.008159343153238297, 0.008532021194696426, 0.008904699236154556, 0.00927737820893526, 0.00965005625039339, 0.010022735223174095, 0.010395413264632225, 0.01076809223741293, 0.01114077027887106, 0.01151344832032919, 0.011886127293109894, 0.012258805334568024, 0.012631483376026154, 0.013004161417484283]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 13.0, 16.0, 33.0, 41.0, 49.0, 93.0, 134.0, 193.0, 326.0, 447.0, 694.0, 1055.0, 1597.0, 2433.0, 3836.0, 6003.0, 9295.0, 14792.0, 23796.0, 39190.0, 68056.0, 129248.0, 280890.0, 217805.0, 103510.0, 56475.0, 33015.0, 20679.0, 12579.0, 7939.0, 5102.0, 3117.0, 2091.0, 1291.0, 910.0, 635.0, 406.0, 279.0, 164.0, 104.0, 78.0, 50.0, 35.0, 18.0, 10.0, 16.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0254974365234375, -0.02472090721130371, -0.023944377899169922, -0.023167848587036133, -0.022391319274902344, -0.021614789962768555, -0.020838260650634766, -0.020061731338500977, -0.019285202026367188, -0.0185086727142334, -0.01773214340209961, -0.01695561408996582, -0.01617908477783203, -0.015402555465698242, -0.014626026153564453, -0.013849496841430664, -0.013072967529296875, -0.012296438217163086, -0.011519908905029297, -0.010743379592895508, -0.009966850280761719, -0.00919032096862793, -0.00841379165649414, -0.0076372623443603516, -0.0068607330322265625, -0.0060842037200927734, -0.005307674407958984, -0.004531145095825195, -0.0037546157836914062, -0.002978086471557617, -0.002201557159423828, -0.001425027847290039, -0.00064849853515625, 0.00012803077697753906, 0.0009045600891113281, 0.0016810894012451172, 0.0024576187133789062, 0.0032341480255126953, 0.004010677337646484, 0.0047872066497802734, 0.0055637359619140625, 0.0063402652740478516, 0.007116794586181641, 0.00789332389831543, 0.008669853210449219, 0.009446382522583008, 0.010222911834716797, 0.010999441146850586, 0.011775970458984375, 0.012552499771118164, 0.013329029083251953, 0.014105558395385742, 0.014882087707519531, 0.01565861701965332, 0.01643514633178711, 0.0172116756439209, 0.017988204956054688, 0.018764734268188477, 0.019541263580322266, 0.020317792892456055, 0.021094322204589844, 0.021870851516723633, 0.022647380828857422, 0.02342391014099121, 0.024200439453125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 5.0, 17.0, 28.0, 18.0, 24.0, 23.0, 30.0, 34.0, 24.0, 44.0, 35.0, 30.0, 37.0, 39.0, 37.0, 47.0, 49.0, 39.0, 42.0, 43.0, 40.0, 34.0, 36.0, 28.0, 31.0, 16.0, 29.0, 22.0, 16.0, 19.0, 13.0, 12.0, 10.0, 5.0, 5.0, 3.0, 5.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0097808837890625, -0.009441375732421875, -0.00910186767578125, -0.008762359619140625, -0.0084228515625, -0.008083343505859375, -0.00774383544921875, -0.007404327392578125, -0.0070648193359375, -0.006725311279296875, -0.00638580322265625, -0.006046295166015625, -0.005706787109375, -0.005367279052734375, -0.00502777099609375, -0.004688262939453125, -0.0043487548828125, -0.004009246826171875, -0.00366973876953125, -0.003330230712890625, -0.00299072265625, -0.002651214599609375, -0.00231170654296875, -0.001972198486328125, -0.0016326904296875, -0.001293182373046875, -0.00095367431640625, -0.000614166259765625, -0.000274658203125, 6.4849853515625e-05, 0.00040435791015625, 0.000743865966796875, 0.0010833740234375, 0.001422882080078125, 0.00176239013671875, 0.002101898193359375, 0.00244140625, 0.002780914306640625, 0.00312042236328125, 0.003459930419921875, 0.0037994384765625, 0.004138946533203125, 0.00447845458984375, 0.004817962646484375, 0.005157470703125, 0.005496978759765625, 0.00583648681640625, 0.006175994873046875, 0.0065155029296875, 0.006855010986328125, 0.00719451904296875, 0.007534027099609375, 0.00787353515625, 0.008213043212890625, 0.00855255126953125, 0.008892059326171875, 0.0092315673828125, 0.009571075439453125, 0.00991058349609375, 0.010250091552734375, 0.010589599609375, 0.010929107666015625, 0.01126861572265625, 0.011608123779296875, 0.0119476318359375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 13.0, 10.0, 27.0, 39.0, 77.0, 111.0, 150.0, 232.0, 388.0, 569.0, 900.0, 1436.0, 2240.0, 3534.0, 5867.0, 9628.0, 16155.0, 27436.0, 47883.0, 87770.0, 178374.0, 321885.0, 157269.0, 79355.0, 43897.0, 25303.0, 14672.0, 8780.0, 5498.0, 3333.0, 2105.0, 1285.0, 774.0, 550.0, 315.0, 242.0, 157.0, 103.0, 69.0, 41.0, 32.0, 16.0, 9.0, 6.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0265655517578125, -0.02577066421508789, -0.02497577667236328, -0.024180889129638672, -0.023386001586914062, -0.022591114044189453, -0.021796226501464844, -0.021001338958740234, -0.020206451416015625, -0.019411563873291016, -0.018616676330566406, -0.017821788787841797, -0.017026901245117188, -0.016232013702392578, -0.015437126159667969, -0.01464223861694336, -0.01384735107421875, -0.01305246353149414, -0.012257575988769531, -0.011462688446044922, -0.010667800903320312, -0.009872913360595703, -0.009078025817871094, -0.008283138275146484, -0.007488250732421875, -0.006693363189697266, -0.005898475646972656, -0.005103588104248047, -0.0043087005615234375, -0.003513813018798828, -0.0027189254760742188, -0.0019240379333496094, -0.001129150390625, -0.0003342628479003906, 0.00046062469482421875, 0.0012555122375488281, 0.0020503997802734375, 0.002845287322998047, 0.0036401748657226562, 0.004435062408447266, 0.005229949951171875, 0.006024837493896484, 0.006819725036621094, 0.007614612579345703, 0.008409500122070312, 0.009204387664794922, 0.009999275207519531, 0.01079416275024414, 0.01158905029296875, 0.01238393783569336, 0.013178825378417969, 0.013973712921142578, 0.014768600463867188, 0.015563488006591797, 0.016358375549316406, 0.017153263092041016, 0.017948150634765625, 0.018743038177490234, 0.019537925720214844, 0.020332813262939453, 0.021127700805664062, 0.021922588348388672, 0.02271747589111328, 0.02351236343383789, 0.0243072509765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 1.0, 5.0, 6.0, 5.0, 7.0, 12.0, 12.0, 16.0, 11.0, 16.0, 22.0, 14.0, 31.0, 25.0, 25.0, 31.0, 28.0, 45.0, 40.0, 27.0, 46.0, 33.0, 34.0, 28.0, 49.0, 35.0, 32.0, 39.0, 29.0, 37.0, 35.0, 29.0, 27.0, 30.0, 21.0, 19.0, 17.0, 17.0, 13.0, 10.0, 14.0, 5.0, 11.0, 5.0, 4.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.00701904296875, -0.006818890571594238, -0.0066187381744384766, -0.006418585777282715, -0.006218433380126953, -0.006018280982971191, -0.00581812858581543, -0.005617976188659668, -0.005417823791503906, -0.0052176713943481445, -0.005017518997192383, -0.004817366600036621, -0.004617214202880859, -0.004417061805725098, -0.004216909408569336, -0.004016757011413574, -0.0038166046142578125, -0.0036164522171020508, -0.003416299819946289, -0.0032161474227905273, -0.0030159950256347656, -0.002815842628479004, -0.002615690231323242, -0.0024155378341674805, -0.0022153854370117188, -0.002015233039855957, -0.0018150806427001953, -0.0016149282455444336, -0.0014147758483886719, -0.0012146234512329102, -0.0010144710540771484, -0.0008143186569213867, -0.000614166259765625, -0.0004140138626098633, -0.00021386146545410156, -1.3709068298339844e-05, 0.00018644332885742188, 0.0003865957260131836, 0.0005867481231689453, 0.000786900520324707, 0.0009870529174804688, 0.0011872053146362305, 0.0013873577117919922, 0.001587510108947754, 0.0017876625061035156, 0.0019878149032592773, 0.002187967300415039, 0.0023881196975708008, 0.0025882720947265625, 0.0027884244918823242, 0.002988576889038086, 0.0031887292861938477, 0.0033888816833496094, 0.003589034080505371, 0.003789186477661133, 0.0039893388748168945, 0.004189491271972656, 0.004389643669128418, 0.00458979606628418, 0.004789948463439941, 0.004990100860595703, 0.005190253257751465, 0.0053904056549072266, 0.005590558052062988, 0.00579071044921875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 6.0, 16.0, 16.0, 22.0, 35.0, 46.0, 73.0, 115.0, 169.0, 286.0, 420.0, 591.0, 891.0, 1298.0, 2068.0, 3449.0, 6055.0, 12578.0, 29273.0, 117339.0, 778624.0, 54611.0, 19236.0, 9007.0, 4641.0, 2677.0, 1622.0, 1176.0, 733.0, 496.0, 308.0, 213.0, 159.0, 93.0, 66.0, 52.0, 31.0, 17.0, 15.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006899833679199219, -0.0006664097309112549, -0.0006428360939025879, -0.0006192624568939209, -0.0005956888198852539, -0.0005721151828765869, -0.0005485415458679199, -0.0005249679088592529, -0.0005013942718505859, -0.00047782063484191895, -0.00045424699783325195, -0.00043067336082458496, -0.00040709972381591797, -0.000383526086807251, -0.000359952449798584, -0.000336378812789917, -0.00031280517578125, -0.000289231538772583, -0.000265657901763916, -0.00024208426475524902, -0.00021851062774658203, -0.00019493699073791504, -0.00017136335372924805, -0.00014778971672058105, -0.00012421607971191406, -0.00010064244270324707, -7.706880569458008e-05, -5.3495168685913086e-05, -2.9921531677246094e-05, -6.3478946685791016e-06, 1.722574234008789e-05, 4.079937934875488e-05, 6.437301635742188e-05, 8.794665336608887e-05, 0.00011152029037475586, 0.00013509392738342285, 0.00015866756439208984, 0.00018224120140075684, 0.00020581483840942383, 0.00022938847541809082, 0.0002529621124267578, 0.0002765357494354248, 0.0003001093864440918, 0.0003236830234527588, 0.0003472566604614258, 0.0003708302974700928, 0.00039440393447875977, 0.00041797757148742676, 0.00044155120849609375, 0.00046512484550476074, 0.0004886984825134277, 0.0005122721195220947, 0.0005358457565307617, 0.0005594193935394287, 0.0005829930305480957, 0.0006065666675567627, 0.0006301403045654297, 0.0006537139415740967, 0.0006772875785827637, 0.0007008612155914307, 0.0007244348526000977, 0.0007480084896087646, 0.0007715821266174316, 0.0007951557636260986, 0.0008187294006347656]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 0.0, 0.0, 7.0, 0.0, 0.0, 9.0, 0.0, 15.0, 0.0, 0.0, 23.0, 0.0, 0.0, 31.0, 0.0, 0.0, 65.0, 0.0, 0.0, 72.0, 0.0, 87.0, 0.0, 0.0, 413.0, 0.0, 0.0, 88.0, 0.0, 0.0, 56.0, 0.0, 48.0, 0.0, 0.0, 33.0, 0.0, 0.0, 29.0, 0.0, 0.0, 12.0, 0.0, 0.0, 14.0, 0.0, 5.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.342306733131409e-07, -6.128102540969849e-07, -5.913898348808289e-07, -5.699694156646729e-07, -5.485489964485168e-07, -5.271285772323608e-07, -5.057081580162048e-07, -4.842877388000488e-07, -4.628673195838928e-07, -4.414469003677368e-07, -4.200264811515808e-07, -3.986060619354248e-07, -3.771856427192688e-07, -3.557652235031128e-07, -3.343448042869568e-07, -3.129243850708008e-07, -2.915039658546448e-07, -2.7008354663848877e-07, -2.4866312742233276e-07, -2.2724270820617676e-07, -2.0582228899002075e-07, -1.8440186977386475e-07, -1.6298145055770874e-07, -1.4156103134155273e-07, -1.2014061212539673e-07, -9.872019290924072e-08, -7.729977369308472e-08, -5.587935447692871e-08, -3.4458935260772705e-08, -1.30385160446167e-08, 8.381903171539307e-09, 2.9802322387695312e-08, 5.122274160385132e-08, 7.264316082000732e-08, 9.406358003616333e-08, 1.1548399925231934e-07, 1.3690441846847534e-07, 1.5832483768463135e-07, 1.7974525690078735e-07, 2.0116567611694336e-07, 2.2258609533309937e-07, 2.4400651454925537e-07, 2.654269337654114e-07, 2.868473529815674e-07, 3.082677721977234e-07, 3.296881914138794e-07, 3.511086106300354e-07, 3.725290298461914e-07, 3.939494490623474e-07, 4.153698682785034e-07, 4.367902874946594e-07, 4.5821070671081543e-07, 4.796311259269714e-07, 5.010515451431274e-07, 5.224719643592834e-07, 5.438923835754395e-07, 5.653128027915955e-07, 5.867332220077515e-07, 6.081536412239075e-07, 6.295740604400635e-07, 6.509944796562195e-07, 6.724148988723755e-07, 6.938353180885315e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 7.0, 14.0, 11.0, 12.0, 21.0, 22.0, 37.0, 76.0, 73.0, 107.0, 167.0, 253.0, 348.0, 513.0, 652.0, 1012.0, 1443.0, 2203.0, 3387.0, 5625.0, 10007.0, 20023.0, 49296.0, 692705.0, 178666.0, 40817.0, 17289.0, 9077.0, 5057.0, 3096.0, 2082.0, 1372.0, 885.0, 658.0, 443.0, 322.0, 236.0, 148.0, 128.0, 69.0, 52.0, 50.0, 28.0, 20.0, 10.0, 11.0, 7.0, 8.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.0006279945373535156, -0.0006076768040657043, -0.0005873590707778931, -0.0005670413374900818, -0.0005467236042022705, -0.0005264058709144592, -0.000506088137626648, -0.00048577040433883667, -0.0004654526710510254, -0.0004451349377632141, -0.00042481720447540283, -0.00040449947118759155, -0.0003841817378997803, -0.000363864004611969, -0.0003435462713241577, -0.00032322853803634644, -0.00030291080474853516, -0.0002825930714607239, -0.0002622753381729126, -0.00024195760488510132, -0.00022163987159729004, -0.00020132213830947876, -0.00018100440502166748, -0.0001606866717338562, -0.00014036893844604492, -0.00012005120515823364, -9.973347187042236e-05, -7.941573858261108e-05, -5.9098005294799805e-05, -3.8780272006988525e-05, -1.8462538719177246e-05, 1.8551945686340332e-06, 2.2172927856445312e-05, 4.249066114425659e-05, 6.280839443206787e-05, 8.312612771987915e-05, 0.00010344386100769043, 0.0001237615942955017, 0.000144079327583313, 0.00016439706087112427, 0.00018471479415893555, 0.00020503252744674683, 0.0002253502607345581, 0.0002456679940223694, 0.00026598572731018066, 0.00028630346059799194, 0.0003066211938858032, 0.0003269389271736145, 0.0003472566604614258, 0.00036757439374923706, 0.00038789212703704834, 0.0004082098603248596, 0.0004285275936126709, 0.0004488453269004822, 0.00046916306018829346, 0.0004894807934761047, 0.000509798526763916, 0.0005301162600517273, 0.0005504339933395386, 0.0005707517266273499, 0.0005910694599151611, 0.0006113871932029724, 0.0006317049264907837, 0.000652022659778595, 0.0006723403930664062]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 5.0, 6.0, 3.0, 14.0, 12.0, 13.0, 23.0, 31.0, 32.0, 59.0, 101.0, 479.0, 67.0, 42.0, 35.0, 20.0, 11.0, 8.0, 11.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001881122589111328, -0.00018206611275672913, -0.00017601996660232544, -0.00016997382044792175, -0.00016392767429351807, -0.00015788152813911438, -0.0001518353819847107, -0.000145789235830307, -0.00013974308967590332, -0.00013369694352149963, -0.00012765079736709595, -0.00012160465121269226, -0.00011555850505828857, -0.00010951235890388489, -0.0001034662127494812, -9.742006659507751e-05, -9.137392044067383e-05, -8.532777428627014e-05, -7.928162813186646e-05, -7.323548197746277e-05, -6.718933582305908e-05, -6.11431896686554e-05, -5.509704351425171e-05, -4.905089735984802e-05, -4.3004751205444336e-05, -3.695860505104065e-05, -3.091245889663696e-05, -2.4866312742233276e-05, -1.882016658782959e-05, -1.2774020433425903e-05, -6.727874279022217e-06, -6.817281246185303e-07, 5.364418029785156e-06, 1.1410564184188843e-05, 1.745671033859253e-05, 2.3502856492996216e-05, 2.9549002647399902e-05, 3.559514880180359e-05, 4.1641294956207275e-05, 4.768744111061096e-05, 5.373358726501465e-05, 5.9779733419418335e-05, 6.582587957382202e-05, 7.187202572822571e-05, 7.79181718826294e-05, 8.396431803703308e-05, 9.001046419143677e-05, 9.605661034584045e-05, 0.00010210275650024414, 0.00010814890265464783, 0.00011419504880905151, 0.0001202411949634552, 0.0001262873411178589, 0.00013233348727226257, 0.00013837963342666626, 0.00014442577958106995, 0.00015047192573547363, 0.00015651807188987732, 0.000162564218044281, 0.0001686103641986847, 0.00017465651035308838, 0.00018070265650749207, 0.00018674880266189575, 0.00019279494881629944, 0.00019884109497070312]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 3.0, 6.0, 21.0, 15.0, 14.0, 29.0, 33.0, 56.0, 61.0, 76.0, 103.0, 131.0, 108.0, 92.0, 63.0, 44.0, 35.0, 28.0, 19.0, 16.0, 13.0, 9.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02430631034076214, -0.023675663396716118, -0.023045016452670097, -0.022414367645978928, -0.021783720701932907, -0.021153073757886887, -0.020522426813840866, -0.019891779869794846, -0.019261132925748825, -0.018630485981702805, -0.017999839037656784, -0.017369190230965614, -0.016738543286919594, -0.016107896342873573, -0.015477249398827553, -0.014846602454781532, -0.014215953648090363, -0.013585306704044342, -0.012954658828675747, -0.012324011884629726, -0.011693364009261131, -0.01106271706521511, -0.01043207012116909, -0.00980142317712307, -0.009170775301754475, -0.008540128357708454, -0.007909480482339859, -0.0072788335382938385, -0.006648186128586531, -0.006017538718879223, -0.005386891774833202, -0.0047562443651258945, -0.004125598818063736, -0.003494951408356428, -0.002864304231479764, -0.0022336570546031, -0.001603009644895792, -0.0009723622351884842, -0.00034171505831182003, 0.00028893211856484413, 0.000919579528272152, 0.001550226821564138, 0.002180874114856124, 0.002811521291732788, 0.003442168701440096, 0.004072816111147404, 0.004703463055193424, 0.005334110464900732, 0.00596475787460804, 0.006595405284315348, 0.0072260526940226555, 0.007856699638068676, 0.008487347513437271, 0.009117994457483292, 0.009748641401529312, 0.010379288345575333, 0.011009936220943928, 0.011640583164989948, 0.012271231040358543, 0.012901877984404564, 0.013532524928450584, 0.01416317280381918, 0.0147938197478652, 0.015424467623233795, 0.016055114567279816]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 3.0, 4.0, 8.0, 7.0, 10.0, 10.0, 18.0, 18.0, 28.0, 23.0, 32.0, 37.0, 23.0, 28.0, 21.0, 32.0, 37.0, 35.0, 29.0, 38.0, 40.0, 21.0, 38.0, 49.0, 32.0, 48.0, 37.0, 35.0, 32.0, 21.0, 31.0, 19.0, 19.0, 19.0, 15.0, 17.0, 15.0, 11.0, 6.0, 16.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.01008532289415598, -0.009762334637343884, -0.009439346380531788, -0.009116357192397118, -0.008793368935585022, -0.008470380678772926, -0.00814739242196083, -0.007824404165148735, -0.007501415908336639, -0.007178427651524544, -0.006855438929051161, -0.006532450672239065, -0.0062094624154269695, -0.005886473692953587, -0.005563485436141491, -0.005240497179329395, -0.004917508456856012, -0.004594520200043917, -0.004271531477570534, -0.003948543220758438, -0.0036255549639463425, -0.003302566474303603, -0.002979577984660864, -0.0026565897278487682, -0.002333601238206029, -0.0020106127485632896, -0.001687624491751194, -0.0013646360021084547, -0.0010416476288810372, -0.0007186592556536198, -0.00039567076601088047, -7.268250919878483e-05, 0.00025030598044395447, 0.0005732943536713719, 0.0008962827851064503, 0.0012192712165415287, 0.0015422595897689462, 0.0018652479629963636, 0.002188236452639103, 0.0025112247094511986, 0.002834213199093938, 0.003157201688736677, 0.003480189945548773, 0.003803178435191512, 0.004126166924834251, 0.004449155181646347, 0.004772143438458443, 0.005095131695270538, 0.005418120417743921, 0.005741108674556017, 0.0060640973970294, 0.0063870856538414955, 0.006710073910653591, 0.007033062167465687, 0.00735605088993907, 0.007679039146751165, 0.008002027869224548, 0.008325016126036644, 0.00864800438284874, 0.008970992639660835, 0.009293981827795506, 0.009616970084607601, 0.009939958341419697, 0.010262946598231792, 0.010585934855043888]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 6.0, 11.0, 17.0, 12.0, 24.0, 37.0, 49.0, 65.0, 104.0, 148.0, 185.0, 270.0, 392.0, 494.0, 749.0, 1142.0, 1809.0, 2801.0, 4325.0, 6722.0, 10676.0, 17412.0, 28836.0, 49249.0, 89505.0, 180980.0, 498457.0, 1806638.0, 962675.0, 257573.0, 115625.0, 62587.0, 35723.0, 21402.0, 13217.0, 8349.0, 5513.0, 3613.0, 2292.0, 1496.0, 954.0, 719.0, 491.0, 303.0, 210.0, 170.0, 106.0, 70.0, 39.0, 14.0, 14.0, 7.0, 10.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.0168914794921875, -0.01640498638153076, -0.015918493270874023, -0.015432000160217285, -0.014945507049560547, -0.014459013938903809, -0.01397252082824707, -0.013486027717590332, -0.012999534606933594, -0.012513041496276855, -0.012026548385620117, -0.011540055274963379, -0.01105356216430664, -0.010567069053649902, -0.010080575942993164, -0.009594082832336426, -0.009107589721679688, -0.00862109661102295, -0.008134603500366211, -0.007648110389709473, -0.007161617279052734, -0.006675124168395996, -0.006188631057739258, -0.0057021379470825195, -0.005215644836425781, -0.004729151725769043, -0.004242658615112305, -0.0037561655044555664, -0.003269672393798828, -0.00278317928314209, -0.0022966861724853516, -0.0018101930618286133, -0.001323699951171875, -0.0008372068405151367, -0.00035071372985839844, 0.00013577938079833984, 0.0006222724914550781, 0.0011087656021118164, 0.0015952587127685547, 0.002081751823425293, 0.0025682449340820312, 0.0030547380447387695, 0.003541231155395508, 0.004027724266052246, 0.004514217376708984, 0.005000710487365723, 0.005487203598022461, 0.005973696708679199, 0.0064601898193359375, 0.006946682929992676, 0.007433176040649414, 0.007919669151306152, 0.00840616226196289, 0.008892655372619629, 0.009379148483276367, 0.009865641593933105, 0.010352134704589844, 0.010838627815246582, 0.01132512092590332, 0.011811614036560059, 0.012298107147216797, 0.012784600257873535, 0.013271093368530273, 0.013757586479187012, 0.01424407958984375]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 11.0, 13.0, 9.0, 13.0, 16.0, 19.0, 27.0, 36.0, 29.0, 32.0, 21.0, 31.0, 32.0, 41.0, 33.0, 42.0, 49.0, 39.0, 32.0, 36.0, 38.0, 41.0, 43.0, 44.0, 42.0, 22.0, 20.0, 23.0, 22.0, 14.0, 21.0, 12.0, 11.0, 15.0, 12.0, 10.0, 10.0, 3.0, 10.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.006069183349609375, -0.005878925323486328, -0.005688667297363281, -0.005498409271240234, -0.0053081512451171875, -0.005117893218994141, -0.004927635192871094, -0.004737377166748047, -0.004547119140625, -0.004356861114501953, -0.004166603088378906, -0.003976345062255859, -0.0037860870361328125, -0.0035958290100097656, -0.0034055709838867188, -0.003215312957763672, -0.003025054931640625, -0.002834796905517578, -0.0026445388793945312, -0.0024542808532714844, -0.0022640228271484375, -0.0020737648010253906, -0.0018835067749023438, -0.0016932487487792969, -0.00150299072265625, -0.0013127326965332031, -0.0011224746704101562, -0.0009322166442871094, -0.0007419586181640625, -0.0005517005920410156, -0.00036144256591796875, -0.00017118453979492188, 1.9073486328125e-05, 0.00020933151245117188, 0.00039958953857421875, 0.0005898475646972656, 0.0007801055908203125, 0.0009703636169433594, 0.0011606216430664062, 0.0013508796691894531, 0.0015411376953125, 0.0017313957214355469, 0.0019216537475585938, 0.0021119117736816406, 0.0023021697998046875, 0.0024924278259277344, 0.0026826858520507812, 0.002872943878173828, 0.003063201904296875, 0.003253459930419922, 0.0034437179565429688, 0.0036339759826660156, 0.0038242340087890625, 0.004014492034912109, 0.004204750061035156, 0.004395008087158203, 0.00458526611328125, 0.004775524139404297, 0.004965782165527344, 0.005156040191650391, 0.0053462982177734375, 0.005536556243896484, 0.005726814270019531, 0.005917072296142578, 0.006107330322265625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 11.0, 23.0, 40.0, 47.0, 79.0, 95.0, 172.0, 238.0, 395.0, 613.0, 930.0, 1466.0, 2392.0, 3709.0, 6147.0, 10373.0, 17936.0, 32771.0, 63162.0, 129388.0, 293726.0, 843585.0, 1776961.0, 571107.0, 222193.0, 101703.0, 50477.0, 27004.0, 14987.0, 8552.0, 5233.0, 3123.0, 2058.0, 1216.0, 831.0, 531.0, 336.0, 244.0, 151.0, 95.0, 62.0, 38.0, 28.0, 17.0, 10.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0119781494140625, -0.011569857597351074, -0.011161565780639648, -0.010753273963928223, -0.010344982147216797, -0.009936690330505371, -0.009528398513793945, -0.00912010669708252, -0.008711814880371094, -0.008303523063659668, -0.007895231246948242, -0.007486939430236816, -0.007078647613525391, -0.006670355796813965, -0.006262063980102539, -0.005853772163391113, -0.0054454803466796875, -0.005037188529968262, -0.004628896713256836, -0.00422060489654541, -0.0038123130798339844, -0.0034040212631225586, -0.002995729446411133, -0.002587437629699707, -0.0021791458129882812, -0.0017708539962768555, -0.0013625621795654297, -0.0009542703628540039, -0.0005459785461425781, -0.00013768672943115234, 0.00027060508728027344, 0.0006788969039916992, 0.001087188720703125, 0.0014954805374145508, 0.0019037723541259766, 0.0023120641708374023, 0.002720355987548828, 0.003128647804260254, 0.0035369396209716797, 0.0039452314376831055, 0.004353523254394531, 0.004761815071105957, 0.005170106887817383, 0.005578398704528809, 0.005986690521240234, 0.00639498233795166, 0.006803274154663086, 0.007211565971374512, 0.0076198577880859375, 0.008028149604797363, 0.008436441421508789, 0.008844733238220215, 0.00925302505493164, 0.009661316871643066, 0.010069608688354492, 0.010477900505065918, 0.010886192321777344, 0.01129448413848877, 0.011702775955200195, 0.012111067771911621, 0.012519359588623047, 0.012927651405334473, 0.013335943222045898, 0.013744235038757324, 0.01415252685546875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 5.0, 9.0, 10.0, 9.0, 18.0, 22.0, 20.0, 27.0, 42.0, 43.0, 59.0, 69.0, 84.0, 106.0, 148.0, 140.0, 180.0, 228.0, 232.0, 328.0, 365.0, 349.0, 281.0, 235.0, 189.0, 166.0, 145.0, 116.0, 100.0, 77.0, 56.0, 43.0, 33.0, 28.0, 25.0, 21.0, 11.0, 12.0, 12.0, 7.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.0038394927978515625, -0.0037253201007843018, -0.003611147403717041, -0.0034969747066497803, -0.0033828020095825195, -0.003268629312515259, -0.003154456615447998, -0.0030402839183807373, -0.0029261112213134766, -0.002811938524246216, -0.002697765827178955, -0.0025835931301116943, -0.0024694204330444336, -0.002355247735977173, -0.002241075038909912, -0.0021269023418426514, -0.0020127296447753906, -0.0018985569477081299, -0.0017843842506408691, -0.0016702115535736084, -0.0015560388565063477, -0.001441866159439087, -0.0013276934623718262, -0.0012135207653045654, -0.0010993480682373047, -0.000985175371170044, -0.0008710026741027832, -0.0007568299770355225, -0.0006426572799682617, -0.000528484582901001, -0.00041431188583374023, -0.0003001391887664795, -0.00018596649169921875, -7.179379463195801e-05, 4.2378902435302734e-05, 0.00015655159950256348, 0.0002707242965698242, 0.00038489699363708496, 0.0004990696907043457, 0.0006132423877716064, 0.0007274150848388672, 0.0008415877819061279, 0.0009557604789733887, 0.0010699331760406494, 0.0011841058731079102, 0.001298278570175171, 0.0014124512672424316, 0.0015266239643096924, 0.0016407966613769531, 0.0017549693584442139, 0.0018691420555114746, 0.0019833147525787354, 0.002097487449645996, 0.002211660146713257, 0.0023258328437805176, 0.0024400055408477783, 0.002554178237915039, 0.0026683509349823, 0.0027825236320495605, 0.0028966963291168213, 0.003010869026184082, 0.0031250417232513428, 0.0032392144203186035, 0.0033533871173858643, 0.003467559814453125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 7.0, 6.0, 9.0, 14.0, 10.0, 22.0, 27.0, 21.0, 38.0, 38.0, 44.0, 47.0, 65.0, 73.0, 90.0, 91.0, 77.0, 58.0, 46.0, 35.0, 28.0, 24.0, 31.0, 11.0, 12.0, 11.0, 13.0, 8.0, 10.0, 3.0, 9.0, 5.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0087464340031147, -0.008480477146804333, -0.008214520290493965, -0.007948564365506172, -0.007682607509195805, -0.007416650652885437, -0.007150693796575069, -0.006884736940264702, -0.006618780549615622, -0.006352823693305254, -0.006086867302656174, -0.005820910446345806, -0.0055549535900354385, -0.005288997199386358, -0.005023040343075991, -0.00475708395242691, -0.004491127096116543, -0.004225170239806175, -0.003959213849157095, -0.0036932569928467274, -0.0034273003693670034, -0.0031613437458872795, -0.002895386889576912, -0.002629430266097188, -0.002363473642617464, -0.00209751701913774, -0.0018315602792426944, -0.0015656035393476486, -0.0012996469158679247, -0.0010336902923882008, -0.000767733552493155, -0.0005017768125981092, -0.0002358192577958107, 3.0137423891574144e-05, 0.000296094105578959, 0.0005620507872663438, 0.0008280074689537287, 0.0010939640924334526, 0.0013599208323284984, 0.0016258775722235441, 0.001891834195703268, 0.002157790819182992, 0.002423747442662716, 0.0026897042989730835, 0.0029556609224528074, 0.0032216175459325314, 0.003487574402242899, 0.003753531025722623, 0.004019487649202347, 0.004285444505512714, 0.004551400896161795, 0.004817357752472162, 0.0050833141431212425, 0.00534927099943161, 0.005615227855741978, 0.005881184712052345, 0.0061471411027014256, 0.006413097959011793, 0.006679054349660873, 0.006945011205971241, 0.007210968062281609, 0.007476924452930689, 0.0077428813092410564, 0.008008837699890137, 0.008274794556200504]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 8.0, 5.0, 9.0, 15.0, 16.0, 16.0, 15.0, 13.0, 26.0, 21.0, 19.0, 31.0, 35.0, 30.0, 36.0, 43.0, 47.0, 40.0, 36.0, 51.0, 40.0, 38.0, 30.0, 35.0, 28.0, 31.0, 36.0, 37.0, 27.0, 27.0, 31.0, 19.0, 20.0, 17.0, 12.0, 10.0, 11.0, 6.0, 7.0, 9.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0072313533164560795, -0.007021838333457708, -0.006812323350459337, -0.006602808367460966, -0.006393292918801308, -0.0061837779358029366, -0.005974262952804565, -0.005764747969806194, -0.005555232986807823, -0.005345718003809452, -0.005136203020811081, -0.00492668803781271, -0.004717173054814339, -0.0045076580718159676, -0.004298142623156309, -0.004088627640157938, -0.003879112657159567, -0.0036695976741611958, -0.0034600826911628246, -0.00325056747533381, -0.0030410524923354387, -0.0028315375093370676, -0.002622022293508053, -0.0024125073105096817, -0.0022029923275113106, -0.0019934773445129395, -0.0017839622450992465, -0.0015744471456855536, -0.0013649321626871824, -0.0011554171796888113, -0.0009459020802751184, -0.0007363869808614254, -0.000526871532201767, -0.00031735649099573493, -0.00010784144978970289, 0.00010167359141632915, 0.0003111886326223612, 0.0005207036156207323, 0.0007302187150344253, 0.0009397338144481182, 0.0011492487974464893, 0.0013587637804448605, 0.0015682788798585534, 0.0017777939792722464, 0.0019873089622706175, 0.0021968239452689886, 0.0024063391610980034, 0.0026158541440963745, 0.0028253691270947456, 0.0030348841100931168, 0.003244399093091488, 0.0034539143089205027, 0.003663429291918874, 0.003872944274917245, 0.00408245949074626, 0.004291974473744631, 0.004501489456743002, 0.004711004439741373, 0.004920519422739744, 0.005130034405738115, 0.005339549854397774, 0.005549064837396145, 0.005758579820394516, 0.005968094803392887, 0.006177609786391258]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 6.0, 8.0, 12.0, 17.0, 39.0, 54.0, 66.0, 134.0, 176.0, 262.0, 454.0, 646.0, 994.0, 1452.0, 2297.0, 3770.0, 5907.0, 9717.0, 16248.0, 28152.0, 52388.0, 106367.0, 260758.0, 302861.0, 120494.0, 58549.0, 31155.0, 17737.0, 10431.0, 6365.0, 3884.0, 2467.0, 1611.0, 1052.0, 686.0, 441.0, 312.0, 192.0, 150.0, 85.0, 58.0, 36.0, 24.0, 14.0, 10.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00225067138671875, -0.0021732747554779053, -0.0020958781242370605, -0.002018481492996216, -0.001941084861755371, -0.0018636882305145264, -0.0017862915992736816, -0.001708894968032837, -0.0016314983367919922, -0.0015541017055511475, -0.0014767050743103027, -0.001399308443069458, -0.0013219118118286133, -0.0012445151805877686, -0.0011671185493469238, -0.001089721918106079, -0.0010123252868652344, -0.0009349286556243896, -0.0008575320243835449, -0.0007801353931427002, -0.0007027387619018555, -0.0006253421306610107, -0.000547945499420166, -0.0004705488681793213, -0.00039315223693847656, -0.00031575560569763184, -0.0002383589744567871, -0.00016096234321594238, -8.356571197509766e-05, -6.16908073425293e-06, 7.12275505065918e-05, 0.00014862418174743652, 0.00022602081298828125, 0.000303417444229126, 0.0003808140754699707, 0.00045821070671081543, 0.0005356073379516602, 0.0006130039691925049, 0.0006904006004333496, 0.0007677972316741943, 0.0008451938629150391, 0.0009225904941558838, 0.0009999871253967285, 0.0010773837566375732, 0.001154780387878418, 0.0012321770191192627, 0.0013095736503601074, 0.0013869702816009521, 0.0014643669128417969, 0.0015417635440826416, 0.0016191601753234863, 0.001696556806564331, 0.0017739534378051758, 0.0018513500690460205, 0.0019287467002868652, 0.00200614333152771, 0.0020835399627685547, 0.0021609365940093994, 0.002238333225250244, 0.002315729856491089, 0.0023931264877319336, 0.0024705231189727783, 0.002547919750213623, 0.0026253163814544678, 0.0027027130126953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 1.0, 6.0, 9.0, 8.0, 12.0, 11.0, 16.0, 17.0, 20.0, 23.0, 19.0, 21.0, 34.0, 35.0, 39.0, 42.0, 44.0, 44.0, 46.0, 40.0, 32.0, 50.0, 45.0, 40.0, 32.0, 34.0, 33.0, 30.0, 30.0, 28.0, 30.0, 30.0, 17.0, 17.0, 10.0, 9.0, 11.0, 8.0, 9.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00809478759765625, -0.007866621017456055, -0.007638454437255859, -0.007410287857055664, -0.007182121276855469, -0.0069539546966552734, -0.006725788116455078, -0.006497621536254883, -0.0062694549560546875, -0.006041288375854492, -0.005813121795654297, -0.0055849552154541016, -0.005356788635253906, -0.005128622055053711, -0.004900455474853516, -0.00467228889465332, -0.004444122314453125, -0.00421595573425293, -0.003987789154052734, -0.003759622573852539, -0.0035314559936523438, -0.0033032894134521484, -0.003075122833251953, -0.002846956253051758, -0.0026187896728515625, -0.002390623092651367, -0.002162456512451172, -0.0019342899322509766, -0.0017061233520507812, -0.001477956771850586, -0.0012497901916503906, -0.0010216236114501953, -0.00079345703125, -0.0005652904510498047, -0.0003371238708496094, -0.00010895729064941406, 0.00011920928955078125, 0.00034737586975097656, 0.0005755424499511719, 0.0008037090301513672, 0.0010318756103515625, 0.0012600421905517578, 0.0014882087707519531, 0.0017163753509521484, 0.0019445419311523438, 0.002172708511352539, 0.0024008750915527344, 0.0026290416717529297, 0.002857208251953125, 0.0030853748321533203, 0.0033135414123535156, 0.003541707992553711, 0.0037698745727539062, 0.0039980411529541016, 0.004226207733154297, 0.004454374313354492, 0.0046825408935546875, 0.004910707473754883, 0.005138874053955078, 0.0053670406341552734, 0.005595207214355469, 0.005823373794555664, 0.006051540374755859, 0.006279706954956055, 0.00650787353515625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 14.0, 8.0, 9.0, 16.0, 19.0, 24.0, 47.0, 59.0, 68.0, 86.0, 141.0, 154.0, 262.0, 394.0, 542.0, 754.0, 1176.0, 1815.0, 2852.0, 4614.0, 7731.0, 13711.0, 25339.0, 50879.0, 125026.0, 445010.0, 214623.0, 74783.0, 34580.0, 17672.0, 9926.0, 5885.0, 3570.0, 2187.0, 1443.0, 937.0, 623.0, 443.0, 317.0, 210.0, 169.0, 127.0, 94.0, 60.0, 34.0, 31.0, 23.0, 18.0, 18.0, 9.0, 1.0, 6.0, 5.0, 3.0, 0.0, 2.0], "bins": [-0.0038909912109375, -0.0037756264209747314, -0.003660261631011963, -0.0035448968410491943, -0.0034295320510864258, -0.0033141672611236572, -0.0031988024711608887, -0.00308343768119812, -0.0029680728912353516, -0.002852708101272583, -0.0027373433113098145, -0.002621978521347046, -0.0025066137313842773, -0.002391248941421509, -0.0022758841514587402, -0.0021605193614959717, -0.002045154571533203, -0.0019297897815704346, -0.001814424991607666, -0.0016990602016448975, -0.001583695411682129, -0.0014683306217193604, -0.0013529658317565918, -0.0012376010417938232, -0.0011222362518310547, -0.0010068714618682861, -0.0008915066719055176, -0.000776141881942749, -0.0006607770919799805, -0.0005454123020172119, -0.00043004751205444336, -0.0003146827220916748, -0.00019931793212890625, -8.39531421661377e-05, 3.141164779663086e-05, 0.00014677643775939941, 0.00026214122772216797, 0.0003775060176849365, 0.0004928708076477051, 0.0006082355976104736, 0.0007236003875732422, 0.0008389651775360107, 0.0009543299674987793, 0.0010696947574615479, 0.0011850595474243164, 0.001300424337387085, 0.0014157891273498535, 0.001531153917312622, 0.0016465187072753906, 0.0017618834972381592, 0.0018772482872009277, 0.0019926130771636963, 0.002107977867126465, 0.0022233426570892334, 0.002338707447052002, 0.0024540722370147705, 0.002569437026977539, 0.0026848018169403076, 0.002800166606903076, 0.0029155313968658447, 0.0030308961868286133, 0.003146260976791382, 0.0032616257667541504, 0.003376990556716919, 0.0034923553466796875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 7.0, 2.0, 3.0, 10.0, 9.0, 14.0, 6.0, 13.0, 19.0, 26.0, 26.0, 26.0, 31.0, 25.0, 33.0, 36.0, 35.0, 42.0, 44.0, 52.0, 44.0, 44.0, 40.0, 57.0, 35.0, 28.0, 45.0, 30.0, 35.0, 25.0, 23.0, 29.0, 21.0, 18.0, 13.0, 11.0, 9.0, 9.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.005008697509765625, -0.004859864711761475, -0.004711031913757324, -0.004562199115753174, -0.0044133663177490234, -0.004264533519744873, -0.004115700721740723, -0.003966867923736572, -0.003818035125732422, -0.0036692023277282715, -0.003520369529724121, -0.0033715367317199707, -0.0032227039337158203, -0.00307387113571167, -0.0029250383377075195, -0.002776205539703369, -0.0026273727416992188, -0.0024785399436950684, -0.002329707145690918, -0.0021808743476867676, -0.002032041549682617, -0.0018832087516784668, -0.0017343759536743164, -0.001585543155670166, -0.0014367103576660156, -0.0012878775596618652, -0.0011390447616577148, -0.0009902119636535645, -0.0008413791656494141, -0.0006925463676452637, -0.0005437135696411133, -0.0003948807716369629, -0.0002460479736328125, -9.721517562866211e-05, 5.161762237548828e-05, 0.00020045042037963867, 0.00034928321838378906, 0.0004981160163879395, 0.0006469488143920898, 0.0007957816123962402, 0.0009446144104003906, 0.001093447208404541, 0.0012422800064086914, 0.0013911128044128418, 0.0015399456024169922, 0.0016887784004211426, 0.001837611198425293, 0.0019864439964294434, 0.0021352767944335938, 0.002284109592437744, 0.0024329423904418945, 0.002581775188446045, 0.0027306079864501953, 0.0028794407844543457, 0.003028273582458496, 0.0031771063804626465, 0.003325939178466797, 0.0034747719764709473, 0.0036236047744750977, 0.003772437572479248, 0.0039212703704833984, 0.004070103168487549, 0.004218935966491699, 0.00436776876449585, 0.0045166015625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 5.0, 15.0, 12.0, 28.0, 37.0, 38.0, 76.0, 87.0, 128.0, 183.0, 265.0, 374.0, 520.0, 804.0, 1243.0, 1889.0, 3095.0, 5474.0, 10088.0, 21427.0, 53973.0, 225319.0, 575212.0, 87485.0, 29865.0, 13340.0, 6942.0, 3949.0, 2360.0, 1387.0, 963.0, 604.0, 409.0, 270.0, 190.0, 117.0, 100.0, 77.0, 54.0, 36.0, 24.0, 22.0, 17.0, 13.0, 10.0, 9.0, 10.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.00032520294189453125, -0.000315103679895401, -0.00030500441789627075, -0.0002949051558971405, -0.00028480589389801025, -0.00027470663189888, -0.00026460736989974976, -0.0002545081079006195, -0.00024440884590148926, -0.000234309583902359, -0.00022421032190322876, -0.0002141110599040985, -0.00020401179790496826, -0.000193912535905838, -0.00018381327390670776, -0.00017371401190757751, -0.00016361474990844727, -0.00015351548790931702, -0.00014341622591018677, -0.00013331696391105652, -0.00012321770191192627, -0.00011311843991279602, -0.00010301917791366577, -9.291991591453552e-05, -8.282065391540527e-05, -7.272139191627502e-05, -6.262212991714478e-05, -5.2522867918014526e-05, -4.242360591888428e-05, -3.232434391975403e-05, -2.222508192062378e-05, -1.212581992149353e-05, -2.0265579223632812e-06, 8.072704076766968e-06, 1.8171966075897217e-05, 2.8271228075027466e-05, 3.8370490074157715e-05, 4.8469752073287964e-05, 5.856901407241821e-05, 6.866827607154846e-05, 7.876753807067871e-05, 8.886680006980896e-05, 9.896606206893921e-05, 0.00010906532406806946, 0.00011916458606719971, 0.00012926384806632996, 0.0001393631100654602, 0.00014946237206459045, 0.0001595616340637207, 0.00016966089606285095, 0.0001797601580619812, 0.00018985942006111145, 0.0001999586820602417, 0.00021005794405937195, 0.0002201572060585022, 0.00023025646805763245, 0.0002403557300567627, 0.00025045499205589294, 0.0002605542540550232, 0.00027065351605415344, 0.0002807527780532837, 0.00029085204005241394, 0.0003009513020515442, 0.00031105056405067444, 0.0003211498260498047]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 8.0, 0.0, 15.0, 0.0, 22.0, 0.0, 22.0, 0.0, 24.0, 0.0, 41.0, 0.0, 64.0, 0.0, 76.0, 0.0, 93.0, 0.0, 99.0, 0.0, 93.0, 0.0, 94.0, 0.0, 76.0, 0.0, 74.0, 0.0, 63.0, 0.0, 42.0, 0.0, 42.0, 0.0, 21.0, 0.0, 15.0, 0.0, 11.0, 0.0, 6.0, 0.0, 8.0, 0.0, 5.0, 0.0, 1.0, 1.0], "bins": [-1.0728836059570312e-06, -1.043081283569336e-06, -1.0132789611816406e-06, -9.834766387939453e-07, -9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 12.0, 14.0, 14.0, 12.0, 41.0, 57.0, 65.0, 94.0, 139.0, 228.0, 308.0, 459.0, 666.0, 961.0, 1347.0, 2059.0, 3207.0, 5081.0, 8752.0, 15989.0, 36855.0, 114494.0, 584530.0, 177429.0, 48714.0, 19963.0, 10351.0, 5817.0, 3619.0, 2308.0, 1533.0, 1076.0, 697.0, 491.0, 381.0, 228.0, 165.0, 121.0, 97.0, 50.0, 29.0, 39.0, 28.0, 14.0, 5.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000522613525390625, -0.0005055591464042664, -0.0004885047674179077, -0.00047145038843154907, -0.00045439600944519043, -0.0004373416304588318, -0.00042028725147247314, -0.0004032328724861145, -0.00038617849349975586, -0.0003691241145133972, -0.0003520697355270386, -0.00033501535654067993, -0.0003179609775543213, -0.00030090659856796265, -0.000283852219581604, -0.00026679784059524536, -0.0002497434616088867, -0.00023268908262252808, -0.00021563470363616943, -0.0001985803246498108, -0.00018152594566345215, -0.0001644715666770935, -0.00014741718769073486, -0.00013036280870437622, -0.00011330842971801758, -9.625405073165894e-05, -7.919967174530029e-05, -6.214529275894165e-05, -4.509091377258301e-05, -2.8036534786224365e-05, -1.0982155799865723e-05, 6.07222318649292e-06, 2.3126602172851562e-05, 4.0180981159210205e-05, 5.723536014556885e-05, 7.428973913192749e-05, 9.134411811828613e-05, 0.00010839849710464478, 0.00012545287609100342, 0.00014250725507736206, 0.0001595616340637207, 0.00017661601305007935, 0.000193670392036438, 0.00021072477102279663, 0.00022777915000915527, 0.0002448335289955139, 0.00026188790798187256, 0.0002789422869682312, 0.00029599666595458984, 0.0003130510449409485, 0.00033010542392730713, 0.00034715980291366577, 0.0003642141819000244, 0.00038126856088638306, 0.0003983229398727417, 0.00041537731885910034, 0.000432431697845459, 0.0004494860768318176, 0.00046654045581817627, 0.0004835948348045349, 0.0005006492137908936, 0.0005177035927772522, 0.0005347579717636108, 0.0005518123507499695, 0.0005688667297363281]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 8.0, 12.0, 13.0, 22.0, 25.0, 30.0, 32.0, 52.0, 53.0, 68.0, 110.0, 142.0, 89.0, 65.0, 51.0, 27.0, 39.0, 19.0, 22.0, 12.0, 15.0, 10.0, 15.0, 6.0, 5.0, 10.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00011831521987915039, -0.00011442508548498154, -0.00011053495109081268, -0.00010664481669664383, -0.00010275468230247498, -9.886454790830612e-05, -9.497441351413727e-05, -9.108427911996841e-05, -8.719414472579956e-05, -8.330401033163071e-05, -7.941387593746185e-05, -7.5523741543293e-05, -7.163360714912415e-05, -6.774347275495529e-05, -6.385333836078644e-05, -5.9963203966617584e-05, -5.607306957244873e-05, -5.218293517827988e-05, -4.829280078411102e-05, -4.440266638994217e-05, -4.0512531995773315e-05, -3.662239760160446e-05, -3.273226320743561e-05, -2.8842128813266754e-05, -2.49519944190979e-05, -2.1061860024929047e-05, -1.7171725630760193e-05, -1.3281591236591339e-05, -9.391456842422485e-06, -5.501322448253632e-06, -1.6111880540847778e-06, 2.278946340084076e-06, 6.16908073425293e-06, 1.0059215128421783e-05, 1.3949349522590637e-05, 1.783948391675949e-05, 2.1729618310928345e-05, 2.56197527050972e-05, 2.9509887099266052e-05, 3.3400021493434906e-05, 3.729015588760376e-05, 4.1180290281772614e-05, 4.507042467594147e-05, 4.896055907011032e-05, 5.2850693464279175e-05, 5.674082785844803e-05, 6.063096225261688e-05, 6.452109664678574e-05, 6.841123104095459e-05, 7.230136543512344e-05, 7.61914998292923e-05, 8.008163422346115e-05, 8.397176861763e-05, 8.786190301179886e-05, 9.175203740596771e-05, 9.564217180013657e-05, 9.953230619430542e-05, 0.00010342244058847427, 0.00010731257498264313, 0.00011120270937681198, 0.00011509284377098083, 0.00011898297816514969, 0.00012287311255931854, 0.0001267632469534874, 0.00013065338134765625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 7.0, 6.0, 3.0, 9.0, 16.0, 10.0, 15.0, 24.0, 35.0, 33.0, 34.0, 40.0, 56.0, 55.0, 64.0, 100.0, 86.0, 88.0, 52.0, 48.0, 42.0, 21.0, 29.0, 28.0, 18.0, 8.0, 17.0, 7.0, 10.0, 6.0, 6.0, 10.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.008719380013644695, -0.008455540984869003, -0.008191701956093311, -0.007927863858640194, -0.007664024829864502, -0.00740018580108881, -0.007136346772313118, -0.006872508209198713, -0.006608669646084309, -0.006344830617308617, -0.006080992054194212, -0.00581715302541852, -0.005553314462304115, -0.005289475433528423, -0.005025636404752731, -0.004761797841638327, -0.004497958812862635, -0.004234119784086943, -0.003970281220972538, -0.003706442192196846, -0.0034426036290824413, -0.0031787646003067493, -0.002914925804361701, -0.0026510870084166527, -0.0023872482124716043, -0.002123409416526556, -0.0018595706205815077, -0.0015957317082211375, -0.0013318929122760892, -0.0010680541163310409, -0.0008042152039706707, -0.0005403764080256224, -0.00027653761208057404, -1.2698787031695247e-05, 0.00025114003801718354, 0.0005149788921698928, 0.0007788176881149411, 0.0010426564840599895, 0.0013064953964203596, 0.001570334192365408, 0.0018341729883104563, 0.0020980117842555046, 0.002361850580200553, 0.0026256893761456013, 0.0028895284049212933, 0.003153366968035698, 0.00341720599681139, 0.0036810447927564383, 0.003944883588701487, 0.004208722617477179, 0.004472561180591583, 0.004736400209367275, 0.00500023877248168, 0.005264077801257372, 0.005527916364371777, 0.005791755393147469, 0.0060555944219231606, 0.0063194334506988525, 0.006583272013813257, 0.006847111042588949, 0.007110949605703354, 0.007374788634479046, 0.007638627663254738, 0.007902465760707855, 0.008166304789483547]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 8.0, 6.0, 9.0, 16.0, 14.0, 16.0, 15.0, 15.0, 23.0, 25.0, 16.0, 32.0, 34.0, 30.0, 37.0, 43.0, 47.0, 38.0, 37.0, 49.0, 44.0, 38.0, 29.0, 33.0, 28.0, 31.0, 38.0, 35.0, 27.0, 28.0, 28.0, 20.0, 21.0, 17.0, 13.0, 9.0, 11.0, 7.0, 7.0, 9.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.007268261164426804, -0.007060110569000244, -0.006851959973573685, -0.006643808912485838, -0.0064356583170592785, -0.006227507721632719, -0.006019356660544872, -0.005811206065118313, -0.005603055469691753, -0.005394904874265194, -0.0051867542788386345, -0.004978603217750788, -0.004770452622324228, -0.004562302026897669, -0.004354150965809822, -0.004146000370383263, -0.003937849774956703, -0.0037296991795301437, -0.0035215483512729406, -0.0033133975230157375, -0.003105246927589178, -0.0028970963321626186, -0.0026889455039054155, -0.0024807946756482124, -0.002272644080221653, -0.0020644934847950935, -0.0018563426565378904, -0.0016481919446960092, -0.0014400412328541279, -0.0012318905210122466, -0.0010237398091703653, -0.0008155890973284841, -0.0006074379198253155, -0.0003992872079834342, -0.00019113649614155293, 1.701421570032835e-05, 0.00022516492754220963, 0.0004333156393840909, 0.0006414663512259722, 0.0008496170630678535, 0.0010577677749097347, 0.001265918486751616, 0.0014740691985934973, 0.0016822199104353786, 0.0018903706222772598, 0.0020985212177038193, 0.0023066720459610224, 0.0025148228742182255, 0.002722973469644785, 0.0029311240650713444, 0.0031392748933285475, 0.0033474257215857506, 0.00355557631701231, 0.0037637269124388695, 0.003971877507865429, 0.004180028568953276, 0.004388179164379835, 0.004596329759806395, 0.004804480820894241, 0.005012631416320801, 0.00522078201174736, 0.00542893260717392, 0.005637083202600479, 0.005845234263688326, 0.006053384859114885]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 9.0, 12.0, 24.0, 33.0, 51.0, 83.0, 106.0, 169.0, 263.0, 369.0, 595.0, 816.0, 1310.0, 1910.0, 2842.0, 4184.0, 6446.0, 9820.0, 15211.0, 24296.0, 40197.0, 69191.0, 131118.0, 259425.0, 218154.0, 107492.0, 59071.0, 34756.0, 21298.0, 13450.0, 8698.0, 5647.0, 3809.0, 2517.0, 1699.0, 1192.0, 765.0, 526.0, 337.0, 242.0, 136.0, 106.0, 63.0, 48.0, 24.0, 19.0, 10.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.01314544677734375, -0.012745380401611328, -0.012345314025878906, -0.011945247650146484, -0.011545181274414062, -0.01114511489868164, -0.010745048522949219, -0.010344982147216797, -0.009944915771484375, -0.009544849395751953, -0.009144783020019531, -0.00874471664428711, -0.008344650268554688, -0.007944583892822266, -0.007544517517089844, -0.007144451141357422, -0.006744384765625, -0.006344318389892578, -0.005944252014160156, -0.005544185638427734, -0.0051441192626953125, -0.004744052886962891, -0.004343986511230469, -0.003943920135498047, -0.003543853759765625, -0.003143787384033203, -0.0027437210083007812, -0.0023436546325683594, -0.0019435882568359375, -0.0015435218811035156, -0.0011434555053710938, -0.0007433891296386719, -0.00034332275390625, 5.6743621826171875e-05, 0.00045680999755859375, 0.0008568763732910156, 0.0012569427490234375, 0.0016570091247558594, 0.0020570755004882812, 0.002457141876220703, 0.002857208251953125, 0.003257274627685547, 0.0036573410034179688, 0.004057407379150391, 0.0044574737548828125, 0.004857540130615234, 0.005257606506347656, 0.005657672882080078, 0.0060577392578125, 0.006457805633544922, 0.006857872009277344, 0.007257938385009766, 0.0076580047607421875, 0.00805807113647461, 0.008458137512207031, 0.008858203887939453, 0.009258270263671875, 0.009658336639404297, 0.010058403015136719, 0.01045846939086914, 0.010858535766601562, 0.011258602142333984, 0.011658668518066406, 0.012058734893798828, 0.01245880126953125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 7.0, 13.0, 14.0, 20.0, 12.0, 11.0, 22.0, 17.0, 21.0, 26.0, 25.0, 36.0, 41.0, 44.0, 50.0, 49.0, 41.0, 47.0, 40.0, 48.0, 37.0, 36.0, 30.0, 34.0, 38.0, 39.0, 27.0, 23.0, 22.0, 25.0, 14.0, 12.0, 13.0, 10.0, 6.0, 7.0, 4.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.006359100341796875, -0.006176352500915527, -0.00599360466003418, -0.005810856819152832, -0.005628108978271484, -0.005445361137390137, -0.005262613296508789, -0.005079865455627441, -0.004897117614746094, -0.004714369773864746, -0.0045316219329833984, -0.004348874092102051, -0.004166126251220703, -0.0039833784103393555, -0.003800630569458008, -0.00361788272857666, -0.0034351348876953125, -0.003252387046813965, -0.003069639205932617, -0.0028868913650512695, -0.002704143524169922, -0.0025213956832885742, -0.0023386478424072266, -0.002155900001525879, -0.0019731521606445312, -0.0017904043197631836, -0.001607656478881836, -0.0014249086380004883, -0.0012421607971191406, -0.001059412956237793, -0.0008766651153564453, -0.0006939172744750977, -0.00051116943359375, -0.00032842159271240234, -0.0001456737518310547, 3.707408905029297e-05, 0.00021982192993164062, 0.0004025697708129883, 0.0005853176116943359, 0.0007680654525756836, 0.0009508132934570312, 0.001133561134338379, 0.0013163089752197266, 0.0014990568161010742, 0.0016818046569824219, 0.0018645524978637695, 0.002047300338745117, 0.002230048179626465, 0.0024127960205078125, 0.00259554386138916, 0.002778291702270508, 0.0029610395431518555, 0.003143787384033203, 0.0033265352249145508, 0.0035092830657958984, 0.003692030906677246, 0.0038747787475585938, 0.004057526588439941, 0.004240274429321289, 0.004423022270202637, 0.004605770111083984, 0.004788517951965332, 0.00497126579284668, 0.005154013633728027, 0.005336761474609375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 8.0, 13.0, 23.0, 22.0, 31.0, 58.0, 77.0, 94.0, 185.0, 214.0, 334.0, 507.0, 771.0, 1101.0, 1728.0, 2617.0, 4126.0, 6542.0, 10592.0, 17461.0, 29017.0, 50163.0, 91249.0, 180005.0, 291013.0, 160941.0, 83261.0, 46201.0, 26668.0, 16174.0, 9876.0, 6136.0, 3875.0, 2521.0, 1636.0, 1085.0, 704.0, 494.0, 333.0, 216.0, 156.0, 108.0, 63.0, 45.0, 44.0, 17.0, 15.0, 13.0, 7.0, 7.0, 1.0, 2.0, 5.0, 2.0], "bins": [-0.01418304443359375, -0.01377105712890625, -0.01335906982421875, -0.01294708251953125, -0.01253509521484375, -0.01212310791015625, -0.01171112060546875, -0.01129913330078125, -0.01088714599609375, -0.01047515869140625, -0.01006317138671875, -0.00965118408203125, -0.00923919677734375, -0.00882720947265625, -0.00841522216796875, -0.00800323486328125, -0.00759124755859375, -0.00717926025390625, -0.00676727294921875, -0.00635528564453125, -0.00594329833984375, -0.00553131103515625, -0.00511932373046875, -0.00470733642578125, -0.00429534912109375, -0.00388336181640625, -0.00347137451171875, -0.00305938720703125, -0.00264739990234375, -0.00223541259765625, -0.00182342529296875, -0.00141143798828125, -0.00099945068359375, -0.00058746337890625, -0.00017547607421875, 0.00023651123046875, 0.00064849853515625, 0.00106048583984375, 0.00147247314453125, 0.00188446044921875, 0.00229644775390625, 0.00270843505859375, 0.00312042236328125, 0.00353240966796875, 0.00394439697265625, 0.00435638427734375, 0.00476837158203125, 0.00518035888671875, 0.00559234619140625, 0.00600433349609375, 0.00641632080078125, 0.00682830810546875, 0.00724029541015625, 0.00765228271484375, 0.00806427001953125, 0.00847625732421875, 0.00888824462890625, 0.00930023193359375, 0.00971221923828125, 0.01012420654296875, 0.01053619384765625, 0.01094818115234375, 0.01136016845703125, 0.01177215576171875, 0.01218414306640625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 1.0, 4.0, 7.0, 3.0, 9.0, 9.0, 8.0, 12.0, 14.0, 14.0, 28.0, 17.0, 24.0, 20.0, 34.0, 35.0, 37.0, 28.0, 38.0, 44.0, 40.0, 37.0, 29.0, 36.0, 46.0, 37.0, 43.0, 32.0, 39.0, 29.0, 36.0, 23.0, 22.0, 28.0, 22.0, 23.0, 13.0, 14.0, 15.0, 15.0, 7.0, 8.0, 8.0, 4.0, 5.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00362396240234375, -0.0035143494606018066, -0.0034047365188598633, -0.00329512357711792, -0.0031855106353759766, -0.003075897693634033, -0.00296628475189209, -0.0028566718101501465, -0.002747058868408203, -0.0026374459266662598, -0.0025278329849243164, -0.002418220043182373, -0.0023086071014404297, -0.0021989941596984863, -0.002089381217956543, -0.0019797682762145996, -0.0018701553344726562, -0.0017605423927307129, -0.0016509294509887695, -0.0015413165092468262, -0.0014317035675048828, -0.0013220906257629395, -0.001212477684020996, -0.0011028647422790527, -0.0009932518005371094, -0.000883638858795166, -0.0007740259170532227, -0.0006644129753112793, -0.0005548000335693359, -0.0004451870918273926, -0.0003355741500854492, -0.00022596120834350586, -0.0001163482666015625, -6.735324859619141e-06, 0.00010287761688232422, 0.00021249055862426758, 0.00032210350036621094, 0.0004317164421081543, 0.0005413293838500977, 0.000650942325592041, 0.0007605552673339844, 0.0008701682090759277, 0.000979781150817871, 0.0010893940925598145, 0.0011990070343017578, 0.0013086199760437012, 0.0014182329177856445, 0.0015278458595275879, 0.0016374588012695312, 0.0017470717430114746, 0.001856684684753418, 0.0019662976264953613, 0.0020759105682373047, 0.002185523509979248, 0.0022951364517211914, 0.0024047493934631348, 0.002514362335205078, 0.0026239752769470215, 0.002733588218688965, 0.002843201160430908, 0.0029528141021728516, 0.003062427043914795, 0.0031720399856567383, 0.0032816529273986816, 0.003391265869140625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 5.0, 9.0, 14.0, 22.0, 30.0, 43.0, 62.0, 68.0, 105.0, 141.0, 231.0, 323.0, 402.0, 608.0, 891.0, 1285.0, 1964.0, 2852.0, 4587.0, 7458.0, 12546.0, 23428.0, 48728.0, 135611.0, 669249.0, 67335.0, 29965.0, 15642.0, 8905.0, 5414.0, 3477.0, 2248.0, 1484.0, 1064.0, 708.0, 492.0, 336.0, 242.0, 158.0, 111.0, 87.0, 69.0, 52.0, 33.0, 18.0, 24.0, 10.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002865791320800781, -0.0002773888409137726, -0.00026819854974746704, -0.0002590082585811615, -0.00024981796741485596, -0.00024062767624855042, -0.00023143738508224487, -0.00022224709391593933, -0.0002130568027496338, -0.00020386651158332825, -0.0001946762204170227, -0.00018548592925071716, -0.00017629563808441162, -0.00016710534691810608, -0.00015791505575180054, -0.000148724764585495, -0.00013953447341918945, -0.0001303441822528839, -0.00012115389108657837, -0.00011196359992027283, -0.00010277330875396729, -9.358301758766174e-05, -8.43927264213562e-05, -7.520243525505066e-05, -6.601214408874512e-05, -5.6821852922439575e-05, -4.763156175613403e-05, -3.844127058982849e-05, -2.925097942352295e-05, -2.0060688257217407e-05, -1.0870397090911865e-05, -1.6801059246063232e-06, 7.510185241699219e-06, 1.670047640800476e-05, 2.5890767574310303e-05, 3.5081058740615845e-05, 4.427134990692139e-05, 5.346164107322693e-05, 6.265193223953247e-05, 7.184222340583801e-05, 8.103251457214355e-05, 9.02228057384491e-05, 9.941309690475464e-05, 0.00010860338807106018, 0.00011779367923736572, 0.00012698397040367126, 0.0001361742615699768, 0.00014536455273628235, 0.0001545548439025879, 0.00016374513506889343, 0.00017293542623519897, 0.00018212571740150452, 0.00019131600856781006, 0.0002005062997341156, 0.00020969659090042114, 0.00021888688206672668, 0.00022807717323303223, 0.00023726746439933777, 0.0002464577555656433, 0.00025564804673194885, 0.0002648383378982544, 0.00027402862906455994, 0.0002832189202308655, 0.000292409211397171, 0.00030159950256347656]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 0.0, 6.0, 0.0, 9.0, 13.0, 0.0, 18.0, 24.0, 0.0, 46.0, 0.0, 70.0, 90.0, 0.0, 413.0, 96.0, 0.0, 61.0, 0.0, 51.0, 35.0, 0.0, 19.0, 16.0, 0.0, 10.0, 0.0, 3.0, 5.0, 0.0, 6.0, 1.0, 0.0, 3.0, 0.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.760260581970215e-07, -9.387731552124023e-07, -9.015202522277832e-07, -8.642673492431641e-07, -8.270144462585449e-07, -7.897615432739258e-07, -7.525086402893066e-07, -7.152557373046875e-07, -6.780028343200684e-07, -6.407499313354492e-07, -6.034970283508301e-07, -5.662441253662109e-07, -5.289912223815918e-07, -4.917383193969727e-07, -4.544854164123535e-07, -4.172325134277344e-07, -3.7997961044311523e-07, -3.427267074584961e-07, -3.0547380447387695e-07, -2.682209014892578e-07, -2.3096799850463867e-07, -1.9371509552001953e-07, -1.564621925354004e-07, -1.1920928955078125e-07, -8.195638656616211e-08, -4.470348358154297e-08, -7.450580596923828e-09, 2.9802322387695312e-08, 6.705522537231445e-08, 1.043081283569336e-07, 1.4156103134155273e-07, 1.7881393432617188e-07, 2.1606683731079102e-07, 2.5331974029541016e-07, 2.905726432800293e-07, 3.2782554626464844e-07, 3.650784492492676e-07, 4.023313522338867e-07, 4.3958425521850586e-07, 4.76837158203125e-07, 5.140900611877441e-07, 5.513429641723633e-07, 5.885958671569824e-07, 6.258487701416016e-07, 6.631016731262207e-07, 7.003545761108398e-07, 7.37607479095459e-07, 7.748603820800781e-07, 8.121132850646973e-07, 8.493661880493164e-07, 8.866190910339355e-07, 9.238719940185547e-07, 9.611248970031738e-07, 9.98377799987793e-07, 1.0356307029724121e-06, 1.0728836059570312e-06, 1.1101365089416504e-06, 1.1473894119262695e-06, 1.1846423149108887e-06, 1.2218952178955078e-06, 1.259148120880127e-06, 1.296401023864746e-06, 1.3336539268493652e-06, 1.3709068298339844e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 9.0, 20.0, 19.0, 27.0, 26.0, 42.0, 49.0, 49.0, 88.0, 138.0, 162.0, 227.0, 273.0, 440.0, 639.0, 927.0, 1391.0, 2186.0, 3636.0, 6344.0, 11913.0, 26538.0, 73957.0, 727468.0, 118585.0, 37411.0, 15928.0, 7966.0, 4321.0, 2606.0, 1701.0, 1017.0, 727.0, 448.0, 320.0, 239.0, 167.0, 123.0, 94.0, 86.0, 71.0, 54.0, 35.0, 20.0, 18.0, 13.0, 12.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0003941059112548828, -0.0003820471465587616, -0.0003699883818626404, -0.00035792961716651917, -0.00034587085247039795, -0.00033381208777427673, -0.0003217533230781555, -0.0003096945583820343, -0.0002976357936859131, -0.00028557702898979187, -0.00027351826429367065, -0.00026145949959754944, -0.0002494007349014282, -0.000237341970205307, -0.0002252832055091858, -0.00021322444081306458, -0.00020116567611694336, -0.00018910691142082214, -0.00017704814672470093, -0.0001649893820285797, -0.0001529306173324585, -0.00014087185263633728, -0.00012881308794021606, -0.00011675432324409485, -0.00010469555854797363, -9.263679385185242e-05, -8.05780291557312e-05, -6.851926445960999e-05, -5.646049976348877e-05, -4.4401735067367554e-05, -3.234297037124634e-05, -2.0284205675125122e-05, -8.225440979003906e-06, 3.8333237171173096e-06, 1.5892088413238525e-05, 2.795085310935974e-05, 4.000961780548096e-05, 5.206838250160217e-05, 6.412714719772339e-05, 7.61859118938446e-05, 8.824467658996582e-05, 0.00010030344128608704, 0.00011236220598220825, 0.00012442097067832947, 0.00013647973537445068, 0.0001485385000705719, 0.00016059726476669312, 0.00017265602946281433, 0.00018471479415893555, 0.00019677355885505676, 0.00020883232355117798, 0.0002208910882472992, 0.0002329498529434204, 0.0002450086176395416, 0.00025706738233566284, 0.00026912614703178406, 0.0002811849117279053, 0.0002932436764240265, 0.0003053024411201477, 0.0003173612058162689, 0.00032941997051239014, 0.00034147873520851135, 0.00035353749990463257, 0.0003655962646007538, 0.000377655029296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 4.0, 6.0, 5.0, 9.0, 11.0, 15.0, 21.0, 23.0, 32.0, 51.0, 47.0, 120.0, 445.0, 46.0, 45.0, 36.0, 28.0, 13.0, 10.0, 6.0, 5.0, 4.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0001392364501953125, -0.00013536959886550903, -0.00013150274753570557, -0.0001276358962059021, -0.00012376904487609863, -0.00011990219354629517, -0.0001160353422164917, -0.00011216849088668823, -0.00010830163955688477, -0.0001044347882270813, -0.00010056793689727783, -9.670108556747437e-05, -9.28342342376709e-05, -8.896738290786743e-05, -8.510053157806396e-05, -8.12336802482605e-05, -7.736682891845703e-05, -7.349997758865356e-05, -6.96331262588501e-05, -6.576627492904663e-05, -6.189942359924316e-05, -5.80325722694397e-05, -5.416572093963623e-05, -5.0298869609832764e-05, -4.64320182800293e-05, -4.256516695022583e-05, -3.869831562042236e-05, -3.4831464290618896e-05, -3.096461296081543e-05, -2.7097761631011963e-05, -2.3230910301208496e-05, -1.936405897140503e-05, -1.5497207641601562e-05, -1.1630356311798096e-05, -7.763504981994629e-06, -3.896653652191162e-06, -2.9802322387695312e-08, 3.8370490074157715e-06, 7.703900337219238e-06, 1.1570751667022705e-05, 1.5437602996826172e-05, 1.930445432662964e-05, 2.3171305656433105e-05, 2.7038156986236572e-05, 3.090500831604004e-05, 3.4771859645843506e-05, 3.863871097564697e-05, 4.250556230545044e-05, 4.6372413635253906e-05, 5.023926496505737e-05, 5.410611629486084e-05, 5.797296762466431e-05, 6.183981895446777e-05, 6.570667028427124e-05, 6.957352161407471e-05, 7.344037294387817e-05, 7.730722427368164e-05, 8.117407560348511e-05, 8.504092693328857e-05, 8.890777826309204e-05, 9.277462959289551e-05, 9.664148092269897e-05, 0.00010050833225250244, 0.00010437518358230591, 0.00010824203491210938]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 7.0, 7.0, 10.0, 9.0, 29.0, 17.0, 39.0, 34.0, 53.0, 59.0, 63.0, 73.0, 77.0, 84.0, 93.0, 78.0, 38.0, 42.0, 42.0, 22.0, 28.0, 9.0, 15.0, 10.0, 8.0, 8.0, 7.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.007920975796878338, -0.007674016058444977, -0.0074270558543503284, -0.007180096115916967, -0.006933135911822319, -0.006686176173388958, -0.006439216434955597, -0.006192256696522236, -0.0059452964924275875, -0.0056983367539942265, -0.005451376549899578, -0.005204416811466217, -0.004957457073032856, -0.004710496868938208, -0.004463537130504847, -0.004216576926410198, -0.003969617187976837, -0.0037226572167128325, -0.0034756972454488277, -0.0032287375070154667, -0.002981777535751462, -0.0027348175644874573, -0.0024878578260540962, -0.0022408978547900915, -0.001993937883526087, -0.001746977912262082, -0.0015000180574133992, -0.0012530582025647163, -0.0010060982313007116, -0.0007591382600367069, -0.000512178405188024, -0.00026521855033934116, -1.825764775276184e-05, 0.00022870226530358195, 0.00047566217835992575, 0.0007226220914162695, 0.0009695820044726133, 0.001216541975736618, 0.001463501830585301, 0.0017104616854339838, 0.0019574216566979885, 0.0022043816279619932, 0.002451341599225998, 0.002698301337659359, 0.0029452613089233637, 0.0031922212801873684, 0.0034391810186207294, 0.003686140989884734, 0.003933100961148739, 0.0041800606995821, 0.004427020903676748, 0.004673980642110109, 0.004920940846204758, 0.005167900584638119, 0.00541486032307148, 0.005661820061504841, 0.005908780265599489, 0.00615574000403285, 0.006402700208127499, 0.00664965994656086, 0.006896619684994221, 0.007143579889088869, 0.00739053962752223, 0.0076374998316168785, 0.00788445957005024]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 13.0, 5.0, 6.0, 9.0, 15.0, 11.0, 18.0, 20.0, 28.0, 20.0, 20.0, 26.0, 29.0, 33.0, 38.0, 26.0, 40.0, 36.0, 41.0, 38.0, 40.0, 43.0, 37.0, 39.0, 37.0, 37.0, 31.0, 28.0, 31.0, 21.0, 23.0, 21.0, 29.0, 15.0, 17.0, 14.0, 10.0, 10.0, 10.0, 5.0, 7.0, 2.0, 2.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.0060332706198096275, -0.005857438314706087, -0.005681605543941259, -0.005505773238837719, -0.0053299409337341785, -0.005154108162969351, -0.00497827585786581, -0.004802443087100983, -0.004626610781997442, -0.004450778476893902, -0.004274945706129074, -0.004099113401025534, -0.003923281095921993, -0.0037474483251571655, -0.003571616020053625, -0.003395783482119441, -0.0032199511770159006, -0.0030441186390817165, -0.002868286333978176, -0.002692453796043992, -0.002516621258109808, -0.0023407889530062675, -0.0021649564150720835, -0.0019891238771378994, -0.0018132914556190372, -0.001637459034100175, -0.0014616264961659908, -0.0012857940746471286, -0.0011099616531282663, -0.0009341291151940823, -0.00075829669367522, -0.0005824641557410359, -0.0004066317342221737, -0.00023079926904756576, -5.4966803872957826e-05, 0.00012086564674973488, 0.00029669812647625804, 0.0004725306062027812, 0.0006483630277216434, 0.0008241955656558275, 0.0010000279871746898, 0.001175860408693552, 0.001351692946627736, 0.0015275253681465983, 0.0017033577896654606, 0.0018791903275996447, 0.0020550228655338287, 0.002230855170637369, 0.0024066877085715532, 0.0025825202465057373, 0.0027583525516092777, 0.002934185089543462, 0.003110017627477646, 0.0032858499325811863, 0.0034616824705153704, 0.0036375150084495544, 0.003813347313553095, 0.003989179618656635, 0.004165012389421463, 0.004340844694525003, 0.004516676999628544, 0.004692509770393372, 0.004868342075496912, 0.005044174380600452, 0.00522000715136528]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 10.0, 12.0, 9.0, 17.0, 14.0, 26.0, 32.0, 41.0, 63.0, 75.0, 119.0, 178.0, 259.0, 384.0, 483.0, 792.0, 1112.0, 1563.0, 2349.0, 3412.0, 5204.0, 8104.0, 13179.0, 22684.0, 39940.0, 74579.0, 155360.0, 440461.0, 1705977.0, 1151530.0, 291762.0, 122050.0, 62870.0, 35387.0, 20545.0, 12364.0, 7381.0, 4813.0, 3028.0, 2008.0, 1315.0, 893.0, 617.0, 441.0, 279.0, 207.0, 135.0, 77.0, 55.0, 36.0, 22.0, 17.0, 4.0, 4.0, 1.0, 4.0], "bins": [-0.01001739501953125, -0.009745419025421143, -0.009473443031311035, -0.009201467037200928, -0.00892949104309082, -0.008657515048980713, -0.008385539054870605, -0.008113563060760498, -0.00784158706665039, -0.007569611072540283, -0.007297635078430176, -0.007025659084320068, -0.006753683090209961, -0.0064817070960998535, -0.006209731101989746, -0.005937755107879639, -0.005665779113769531, -0.005393803119659424, -0.005121827125549316, -0.004849851131439209, -0.0045778751373291016, -0.004305899143218994, -0.004033923149108887, -0.0037619471549987793, -0.003489971160888672, -0.0032179951667785645, -0.002946019172668457, -0.0026740431785583496, -0.002402067184448242, -0.0021300911903381348, -0.0018581151962280273, -0.00158613920211792, -0.0013141632080078125, -0.001042187213897705, -0.0007702112197875977, -0.0004982352256774902, -0.0002262592315673828, 4.571676254272461e-05, 0.00031769275665283203, 0.0005896687507629395, 0.0008616447448730469, 0.0011336207389831543, 0.0014055967330932617, 0.0016775727272033691, 0.0019495487213134766, 0.002221524715423584, 0.0024935007095336914, 0.002765476703643799, 0.0030374526977539062, 0.0033094286918640137, 0.003581404685974121, 0.0038533806800842285, 0.004125356674194336, 0.004397332668304443, 0.004669308662414551, 0.004941284656524658, 0.005213260650634766, 0.005485236644744873, 0.0057572126388549805, 0.006029188632965088, 0.006301164627075195, 0.006573140621185303, 0.00684511661529541, 0.007117092609405518, 0.007389068603515625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 6.0, 10.0, 7.0, 14.0, 11.0, 20.0, 15.0, 18.0, 26.0, 30.0, 27.0, 35.0, 39.0, 41.0, 38.0, 55.0, 59.0, 48.0, 40.0, 38.0, 32.0, 39.0, 53.0, 28.0, 35.0, 38.0, 24.0, 25.0, 20.0, 18.0, 14.0, 22.0, 15.0, 9.0, 12.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.00424957275390625, -0.00413098931312561, -0.004012405872344971, -0.003893822431564331, -0.0037752389907836914, -0.0036566555500030518, -0.003538072109222412, -0.0034194886684417725, -0.003300905227661133, -0.003182321786880493, -0.0030637383460998535, -0.002945154905319214, -0.0028265714645385742, -0.0027079880237579346, -0.002589404582977295, -0.0024708211421966553, -0.0023522377014160156, -0.002233654260635376, -0.0021150708198547363, -0.0019964873790740967, -0.001877903938293457, -0.0017593204975128174, -0.0016407370567321777, -0.001522153615951538, -0.0014035701751708984, -0.0012849867343902588, -0.0011664032936096191, -0.0010478198528289795, -0.0009292364120483398, -0.0008106529712677002, -0.0006920695304870605, -0.0005734860897064209, -0.00045490264892578125, -0.0003363192081451416, -0.00021773576736450195, -9.91523265838623e-05, 1.9431114196777344e-05, 0.000138014554977417, 0.00025659799575805664, 0.0003751814365386963, 0.0004937648773193359, 0.0006123483180999756, 0.0007309317588806152, 0.0008495151996612549, 0.0009680986404418945, 0.0010866820812225342, 0.0012052655220031738, 0.0013238489627838135, 0.0014424324035644531, 0.0015610158443450928, 0.0016795992851257324, 0.001798182725906372, 0.0019167661666870117, 0.0020353496074676514, 0.002153933048248291, 0.0022725164890289307, 0.0023910999298095703, 0.00250968337059021, 0.0026282668113708496, 0.0027468502521514893, 0.002865433692932129, 0.0029840171337127686, 0.003102600574493408, 0.003221184015274048, 0.0033397674560546875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 9.0, 8.0, 15.0, 24.0, 29.0, 44.0, 62.0, 88.0, 121.0, 188.0, 269.0, 426.0, 635.0, 891.0, 1353.0, 2067.0, 3305.0, 5588.0, 9314.0, 16488.0, 31356.0, 64430.0, 146021.0, 392994.0, 1505143.0, 1373967.0, 369207.0, 138974.0, 61305.0, 30367.0, 15813.0, 9068.0, 5199.0, 3412.0, 2041.0, 1370.0, 855.0, 580.0, 394.0, 266.0, 182.0, 119.0, 93.0, 56.0, 60.0, 26.0, 20.0, 17.0, 5.0, 8.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.00821685791015625, -0.007959842681884766, -0.007702827453613281, -0.007445812225341797, -0.0071887969970703125, -0.006931781768798828, -0.006674766540527344, -0.006417751312255859, -0.006160736083984375, -0.005903720855712891, -0.005646705627441406, -0.005389690399169922, -0.0051326751708984375, -0.004875659942626953, -0.004618644714355469, -0.004361629486083984, -0.0041046142578125, -0.0038475990295410156, -0.0035905838012695312, -0.003333568572998047, -0.0030765533447265625, -0.002819538116455078, -0.0025625228881835938, -0.0023055076599121094, -0.002048492431640625, -0.0017914772033691406, -0.0015344619750976562, -0.0012774467468261719, -0.0010204315185546875, -0.0007634162902832031, -0.0005064010620117188, -0.0002493858337402344, 7.62939453125e-06, 0.0002646446228027344, 0.0005216598510742188, 0.0007786750793457031, 0.0010356903076171875, 0.0012927055358886719, 0.0015497207641601562, 0.0018067359924316406, 0.002063751220703125, 0.0023207664489746094, 0.0025777816772460938, 0.002834796905517578, 0.0030918121337890625, 0.003348827362060547, 0.0036058425903320312, 0.0038628578186035156, 0.004119873046875, 0.004376888275146484, 0.004633903503417969, 0.004890918731689453, 0.0051479339599609375, 0.005404949188232422, 0.005661964416503906, 0.005918979644775391, 0.006175994873046875, 0.006433010101318359, 0.006690025329589844, 0.006947040557861328, 0.0072040557861328125, 0.007461071014404297, 0.007718086242675781, 0.007975101470947266, 0.00823211669921875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 3.0, 15.0, 17.0, 13.0, 13.0, 24.0, 23.0, 25.0, 31.0, 46.0, 59.0, 68.0, 76.0, 99.0, 137.0, 167.0, 213.0, 229.0, 312.0, 346.0, 400.0, 334.0, 292.0, 234.0, 184.0, 146.0, 122.0, 101.0, 62.0, 62.0, 52.0, 34.0, 29.0, 26.0, 21.0, 15.0, 12.0, 10.0, 6.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002162933349609375, -0.0020957589149475098, -0.0020285844802856445, -0.0019614100456237793, -0.001894235610961914, -0.0018270611763000488, -0.0017598867416381836, -0.0016927123069763184, -0.0016255378723144531, -0.0015583634376525879, -0.0014911890029907227, -0.0014240145683288574, -0.0013568401336669922, -0.001289665699005127, -0.0012224912643432617, -0.0011553168296813965, -0.0010881423950195312, -0.001020967960357666, -0.0009537935256958008, -0.0008866190910339355, -0.0008194446563720703, -0.0007522702217102051, -0.0006850957870483398, -0.0006179213523864746, -0.0005507469177246094, -0.00048357248306274414, -0.0004163980484008789, -0.00034922361373901367, -0.00028204917907714844, -0.0002148747444152832, -0.00014770030975341797, -8.052587509155273e-05, -1.33514404296875e-05, 5.3822994232177734e-05, 0.00012099742889404297, 0.0001881718635559082, 0.00025534629821777344, 0.00032252073287963867, 0.0003896951675415039, 0.00045686960220336914, 0.0005240440368652344, 0.0005912184715270996, 0.0006583929061889648, 0.0007255673408508301, 0.0007927417755126953, 0.0008599162101745605, 0.0009270906448364258, 0.000994265079498291, 0.0010614395141601562, 0.0011286139488220215, 0.0011957883834838867, 0.001262962818145752, 0.0013301372528076172, 0.0013973116874694824, 0.0014644861221313477, 0.0015316605567932129, 0.0015988349914550781, 0.0016660094261169434, 0.0017331838607788086, 0.0018003582954406738, 0.001867532730102539, 0.0019347071647644043, 0.0020018815994262695, 0.0020690560340881348, 0.00213623046875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 9.0, 16.0, 13.0, 18.0, 18.0, 28.0, 39.0, 39.0, 67.0, 89.0, 97.0, 121.0, 110.0, 79.0, 71.0, 44.0, 32.0, 25.0, 21.0, 9.0, 11.0, 13.0, 10.0, 8.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0062970626167953014, -0.0060974848456680775, -0.005897906608879566, -0.005698328837752342, -0.005498751066625118, -0.005299173295497894, -0.005099595058709383, -0.004900017287582159, -0.004700439050793648, -0.004500861279666424, -0.0043012830428779125, -0.0041017052717506886, -0.0039021275006234646, -0.003702549496665597, -0.0035029714927077293, -0.0033033937215805054, -0.0031038159504532814, -0.0029042379464954138, -0.00270466017536819, -0.002505082171410322, -0.0023055044002830982, -0.0021059263963252306, -0.001906348392367363, -0.0017067705048248172, -0.0015071926172822714, -0.0013076147297397256, -0.0011080368421971798, -0.0009084588382393122, -0.0007088809506967664, -0.0005093030631542206, -0.00030972505919635296, -0.00011014717165380716, 8.943118155002594e-05, 0.0002890090981964022, 0.0004885870148427784, 0.0006881649605929852, 0.000887742848135531, 0.0010873207356780767, 0.0012868987396359444, 0.0014864766271784902, 0.001686054514721036, 0.0018856324022635818, 0.0020852102898061275, 0.002284788293763995, 0.002484366297721863, 0.0026839440688490868, 0.0028835220728069544, 0.003083100076764822, 0.003282677847892046, 0.0034822558518499136, 0.0036818336229771376, 0.003881411626935005, 0.004080989398062229, 0.004280567169189453, 0.004480145405977964, 0.004679723177105188, 0.0048793014138937, 0.005078879185020924, 0.005278457421809435, 0.005478035192936659, 0.005677612964063883, 0.005877191200852394, 0.006076768971979618, 0.006276346743106842, 0.006475924514234066]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 11.0, 4.0, 8.0, 6.0, 7.0, 14.0, 15.0, 23.0, 14.0, 21.0, 23.0, 38.0, 27.0, 37.0, 44.0, 46.0, 46.0, 48.0, 43.0, 45.0, 57.0, 42.0, 35.0, 37.0, 40.0, 38.0, 35.0, 30.0, 22.0, 23.0, 25.0, 17.0, 25.0, 18.0, 6.0, 5.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0044275932013988495, -0.0042918529361486435, -0.0041561126708984375, -0.004020372871309519, -0.003884632606059313, -0.003748892340809107, -0.003613152075558901, -0.003477411810308695, -0.0033416717778891325, -0.0032059315126389265, -0.003070191480219364, -0.002934451214969158, -0.002798710949718952, -0.00266297091729939, -0.002527230652049184, -0.0023914906196296215, -0.0022557503543794155, -0.0021200100891292095, -0.001984270056709647, -0.0018485297914594412, -0.001712789642624557, -0.0015770494937896729, -0.0014413092285394669, -0.0013055690797045827, -0.0011698289308696985, -0.0010340887820348144, -0.0008983485749922693, -0.0007626083679497242, -0.00062686821911484, -0.0004911280702799559, -0.0003553878632374108, -0.0002196476561948657, -8.390750735998154e-05, 5.1832670578733087e-05, 0.0001875728485174477, 0.00032331302645616233, 0.00045905320439487696, 0.0005947933532297611, 0.0007305335602723062, 0.0008662737673148513, 0.0010020139161497355, 0.0011377540649846196, 0.0012734942138195038, 0.0014092344790697098, 0.001544974627904594, 0.0016807147767394781, 0.001816455041989684, 0.0019521951908245683, 0.0020879353396594524, 0.0022236756049096584, 0.0023594156373292208, 0.0024951559025794268, 0.002630895934998989, 0.002766636200249195, 0.002902376465499401, 0.003038116730749607, 0.0031738567631691694, 0.0033095970284193754, 0.0034453370608389378, 0.0035810773260891438, 0.0037168175913393497, 0.003852557623758912, 0.003988297656178474, 0.00412403792142868, 0.004259778186678886]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 6.0, 13.0, 20.0, 23.0, 25.0, 42.0, 51.0, 78.0, 112.0, 155.0, 295.0, 482.0, 743.0, 1234.0, 2256.0, 4319.0, 8693.0, 19476.0, 49969.0, 155598.0, 490184.0, 207210.0, 62376.0, 23828.0, 10286.0, 4815.0, 2564.0, 1375.0, 829.0, 473.0, 338.0, 192.0, 146.0, 93.0, 79.0, 48.0, 26.0, 19.0, 18.0, 14.0, 11.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002048492431640625, -0.0019856691360473633, -0.0019228458404541016, -0.0018600225448608398, -0.0017971992492675781, -0.0017343759536743164, -0.0016715526580810547, -0.001608729362487793, -0.0015459060668945312, -0.0014830827713012695, -0.0014202594757080078, -0.001357436180114746, -0.0012946128845214844, -0.0012317895889282227, -0.001168966293334961, -0.0011061429977416992, -0.0010433197021484375, -0.0009804964065551758, -0.0009176731109619141, -0.0008548498153686523, -0.0007920265197753906, -0.0007292032241821289, -0.0006663799285888672, -0.0006035566329956055, -0.0005407333374023438, -0.00047791004180908203, -0.0004150867462158203, -0.0003522634506225586, -0.0002894401550292969, -0.00022661685943603516, -0.00016379356384277344, -0.00010097026824951172, -3.814697265625e-05, 2.467632293701172e-05, 8.749961853027344e-05, 0.00015032291412353516, 0.00021314620971679688, 0.0002759695053100586, 0.0003387928009033203, 0.00040161609649658203, 0.00046443939208984375, 0.0005272626876831055, 0.0005900859832763672, 0.0006529092788696289, 0.0007157325744628906, 0.0007785558700561523, 0.0008413791656494141, 0.0009042024612426758, 0.0009670257568359375, 0.0010298490524291992, 0.001092672348022461, 0.0011554956436157227, 0.0012183189392089844, 0.001281142234802246, 0.0013439655303955078, 0.0014067888259887695, 0.0014696121215820312, 0.001532435417175293, 0.0015952587127685547, 0.0016580820083618164, 0.0017209053039550781, 0.0017837285995483398, 0.0018465518951416016, 0.0019093751907348633, 0.001972198486328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 6.0, 7.0, 8.0, 21.0, 19.0, 13.0, 28.0, 36.0, 33.0, 42.0, 41.0, 39.0, 53.0, 51.0, 39.0, 61.0, 66.0, 49.0, 36.0, 40.0, 37.0, 44.0, 28.0, 28.0, 27.0, 21.0, 17.0, 21.0, 23.0, 10.0, 9.0, 6.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004955291748046875, -0.004803895950317383, -0.004652500152587891, -0.0045011043548583984, -0.004349708557128906, -0.004198312759399414, -0.004046916961669922, -0.0038955211639404297, -0.0037441253662109375, -0.0035927295684814453, -0.003441333770751953, -0.003289937973022461, -0.0031385421752929688, -0.0029871463775634766, -0.0028357505798339844, -0.002684354782104492, -0.002532958984375, -0.002381563186645508, -0.0022301673889160156, -0.0020787715911865234, -0.0019273757934570312, -0.001775979995727539, -0.0016245841979980469, -0.0014731884002685547, -0.0013217926025390625, -0.0011703968048095703, -0.0010190010070800781, -0.0008676052093505859, -0.0007162094116210938, -0.0005648136138916016, -0.0004134178161621094, -0.0002620220184326172, -0.000110626220703125, 4.076957702636719e-05, 0.00019216537475585938, 0.00034356117248535156, 0.0004949569702148438, 0.0006463527679443359, 0.0007977485656738281, 0.0009491443634033203, 0.0011005401611328125, 0.0012519359588623047, 0.0014033317565917969, 0.001554727554321289, 0.0017061233520507812, 0.0018575191497802734, 0.0020089149475097656, 0.002160310745239258, 0.00231170654296875, 0.002463102340698242, 0.0026144981384277344, 0.0027658939361572266, 0.0029172897338867188, 0.003068685531616211, 0.003220081329345703, 0.0033714771270751953, 0.0035228729248046875, 0.0036742687225341797, 0.003825664520263672, 0.003977060317993164, 0.004128456115722656, 0.0042798519134521484, 0.004431247711181641, 0.004582643508911133, 0.004734039306640625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 4.0, 3.0, 2.0, 4.0, 7.0, 8.0, 17.0, 23.0, 23.0, 31.0, 50.0, 78.0, 108.0, 135.0, 196.0, 289.0, 463.0, 590.0, 965.0, 1635.0, 2636.0, 4720.0, 8686.0, 16768.0, 36180.0, 88370.0, 289148.0, 397992.0, 112125.0, 43639.0, 19952.0, 10134.0, 5393.0, 3044.0, 1838.0, 1072.0, 752.0, 438.0, 325.0, 192.0, 180.0, 93.0, 77.0, 44.0, 41.0, 21.0, 24.0, 15.0, 10.0, 8.0, 6.0, 4.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.002101898193359375, -0.002042040228843689, -0.001982182264328003, -0.001922324299812317, -0.0018624663352966309, -0.0018026083707809448, -0.0017427504062652588, -0.0016828924417495728, -0.0016230344772338867, -0.0015631765127182007, -0.0015033185482025146, -0.0014434605836868286, -0.0013836026191711426, -0.0013237446546554565, -0.0012638866901397705, -0.0012040287256240845, -0.0011441707611083984, -0.0010843127965927124, -0.0010244548320770264, -0.0009645968675613403, -0.0009047389030456543, -0.0008448809385299683, -0.0007850229740142822, -0.0007251650094985962, -0.0006653070449829102, -0.0006054490804672241, -0.0005455911159515381, -0.00048573315143585205, -0.000425875186920166, -0.00036601722240448, -0.00030615925788879395, -0.0002463012933731079, -0.00018644332885742188, -0.00012658536434173584, -6.67273998260498e-05, -6.8694353103637695e-06, 5.2988529205322266e-05, 0.0001128464937210083, 0.00017270445823669434, 0.00023256242275238037, 0.0002924203872680664, 0.00035227835178375244, 0.0004121363162994385, 0.0004719942808151245, 0.0005318522453308105, 0.0005917102098464966, 0.0006515681743621826, 0.0007114261388778687, 0.0007712841033935547, 0.0008311420679092407, 0.0008910000324249268, 0.0009508579969406128, 0.0010107159614562988, 0.0010705739259719849, 0.001130431890487671, 0.001190289855003357, 0.001250147819519043, 0.001310005784034729, 0.001369863748550415, 0.001429721713066101, 0.0014895796775817871, 0.0015494376420974731, 0.0016092956066131592, 0.0016691535711288452, 0.0017290115356445312]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 5.0, 3.0, 11.0, 3.0, 7.0, 8.0, 10.0, 11.0, 21.0, 16.0, 17.0, 23.0, 25.0, 23.0, 27.0, 30.0, 26.0, 22.0, 43.0, 34.0, 38.0, 28.0, 36.0, 40.0, 33.0, 37.0, 46.0, 35.0, 36.0, 28.0, 32.0, 25.0, 26.0, 21.0, 21.0, 23.0, 20.0, 10.0, 11.0, 14.0, 14.0, 11.0, 9.0, 8.0, 3.0, 6.0, 4.0, 6.0, 6.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00225830078125, -0.00218355655670166, -0.0021088123321533203, -0.0020340681076049805, -0.0019593238830566406, -0.0018845796585083008, -0.001809835433959961, -0.001735091209411621, -0.0016603469848632812, -0.0015856027603149414, -0.0015108585357666016, -0.0014361143112182617, -0.0013613700866699219, -0.001286625862121582, -0.0012118816375732422, -0.0011371374130249023, -0.0010623931884765625, -0.0009876489639282227, -0.0009129047393798828, -0.000838160514831543, -0.0007634162902832031, -0.0006886720657348633, -0.0006139278411865234, -0.0005391836166381836, -0.00046443939208984375, -0.0003896951675415039, -0.00031495094299316406, -0.00024020671844482422, -0.00016546249389648438, -9.071826934814453e-05, -1.5974044799804688e-05, 5.8770179748535156e-05, 0.000133514404296875, 0.00020825862884521484, 0.0002830028533935547, 0.00035774707794189453, 0.0004324913024902344, 0.0005072355270385742, 0.0005819797515869141, 0.0006567239761352539, 0.0007314682006835938, 0.0008062124252319336, 0.0008809566497802734, 0.0009557008743286133, 0.0010304450988769531, 0.001105189323425293, 0.0011799335479736328, 0.0012546777725219727, 0.0013294219970703125, 0.0014041662216186523, 0.0014789104461669922, 0.001553654670715332, 0.0016283988952636719, 0.0017031431198120117, 0.0017778873443603516, 0.0018526315689086914, 0.0019273757934570312, 0.002002120018005371, 0.002076864242553711, 0.0021516084671020508, 0.0022263526916503906, 0.0023010969161987305, 0.0023758411407470703, 0.00245058536529541, 0.00252532958984375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 14.0, 14.0, 26.0, 18.0, 26.0, 28.0, 57.0, 88.0, 111.0, 175.0, 209.0, 277.0, 460.0, 659.0, 1021.0, 1533.0, 2306.0, 3918.0, 6457.0, 11558.0, 22095.0, 47388.0, 134677.0, 544501.0, 161818.0, 53952.0, 24220.0, 12362.0, 6976.0, 4028.0, 2574.0, 1649.0, 1000.0, 712.0, 503.0, 368.0, 228.0, 155.0, 110.0, 85.0, 49.0, 52.0, 33.0, 24.0, 13.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.00019168853759765625, -0.00018597766757011414, -0.00018026679754257202, -0.0001745559275150299, -0.0001688450574874878, -0.00016313418745994568, -0.00015742331743240356, -0.00015171244740486145, -0.00014600157737731934, -0.00014029070734977722, -0.0001345798373222351, -0.000128868967294693, -0.00012315809726715088, -0.00011744722723960876, -0.00011173635721206665, -0.00010602548718452454, -0.00010031461715698242, -9.460374712944031e-05, -8.88928771018982e-05, -8.318200707435608e-05, -7.747113704681396e-05, -7.176026701927185e-05, -6.604939699172974e-05, -6.033852696418762e-05, -5.462765693664551e-05, -4.8916786909103394e-05, -4.320591688156128e-05, -3.7495046854019165e-05, -3.178417682647705e-05, -2.6073306798934937e-05, -2.0362436771392822e-05, -1.4651566743850708e-05, -8.940696716308594e-06, -3.2298266887664795e-06, 2.4810433387756348e-06, 8.191913366317749e-06, 1.3902783393859863e-05, 1.9613653421401978e-05, 2.5324523448944092e-05, 3.1035393476486206e-05, 3.674626350402832e-05, 4.2457133531570435e-05, 4.816800355911255e-05, 5.387887358665466e-05, 5.958974361419678e-05, 6.530061364173889e-05, 7.1011483669281e-05, 7.672235369682312e-05, 8.243322372436523e-05, 8.814409375190735e-05, 9.385496377944946e-05, 9.956583380699158e-05, 0.00010527670383453369, 0.0001109875738620758, 0.00011669844388961792, 0.00012240931391716003, 0.00012812018394470215, 0.00013383105397224426, 0.00013954192399978638, 0.0001452527940273285, 0.0001509636640548706, 0.00015667453408241272, 0.00016238540410995483, 0.00016809627413749695, 0.00017380714416503906]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 0.0, 5.0, 3.0, 4.0, 9.0, 11.0, 9.0, 8.0, 0.0, 19.0, 24.0, 17.0, 36.0, 40.0, 42.0, 53.0, 0.0, 66.0, 62.0, 67.0, 63.0, 82.0, 55.0, 55.0, 0.0, 61.0, 44.0, 36.0, 29.0, 24.0, 18.0, 19.0, 0.0, 9.0, 11.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7955899238586426e-06, -1.7434358596801758e-06, -1.691281795501709e-06, -1.6391277313232422e-06, -1.5869736671447754e-06, -1.5348196029663086e-06, -1.4826655387878418e-06, -1.430511474609375e-06, -1.3783574104309082e-06, -1.3262033462524414e-06, -1.2740492820739746e-06, -1.2218952178955078e-06, -1.169741153717041e-06, -1.1175870895385742e-06, -1.0654330253601074e-06, -1.0132789611816406e-06, -9.611248970031738e-07, -9.08970832824707e-07, -8.568167686462402e-07, -8.046627044677734e-07, -7.525086402893066e-07, -7.003545761108398e-07, -6.48200511932373e-07, -5.960464477539062e-07, -5.438923835754395e-07, -4.917383193969727e-07, -4.3958425521850586e-07, -3.8743019104003906e-07, -3.3527612686157227e-07, -2.8312206268310547e-07, -2.3096799850463867e-07, -1.7881393432617188e-07, -1.2665987014770508e-07, -7.450580596923828e-08, -2.2351741790771484e-08, 2.9802322387695312e-08, 8.195638656616211e-08, 1.341104507446289e-07, 1.862645149230957e-07, 2.384185791015625e-07, 2.905726432800293e-07, 3.427267074584961e-07, 3.948807716369629e-07, 4.470348358154297e-07, 4.991888999938965e-07, 5.513429641723633e-07, 6.034970283508301e-07, 6.556510925292969e-07, 7.078051567077637e-07, 7.599592208862305e-07, 8.121132850646973e-07, 8.642673492431641e-07, 9.164214134216309e-07, 9.685754776000977e-07, 1.0207295417785645e-06, 1.0728836059570312e-06, 1.125037670135498e-06, 1.1771917343139648e-06, 1.2293457984924316e-06, 1.2814998626708984e-06, 1.3336539268493652e-06, 1.385807991027832e-06, 1.4379620552062988e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 6.0, 14.0, 14.0, 28.0, 35.0, 45.0, 64.0, 79.0, 158.0, 200.0, 291.0, 420.0, 563.0, 939.0, 1418.0, 2232.0, 3560.0, 5704.0, 10061.0, 18188.0, 35049.0, 73302.0, 176736.0, 428363.0, 152775.0, 65782.0, 31845.0, 16611.0, 9285.0, 5423.0, 3273.0, 2049.0, 1318.0, 846.0, 589.0, 409.0, 281.0, 176.0, 118.0, 87.0, 64.0, 42.0, 34.0, 24.0, 23.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0003669261932373047, -0.00035525113344192505, -0.0003435760736465454, -0.00033190101385116577, -0.00032022595405578613, -0.0003085508942604065, -0.00029687583446502686, -0.0002852007746696472, -0.0002735257148742676, -0.00026185065507888794, -0.0002501755952835083, -0.00023850053548812866, -0.00022682547569274902, -0.00021515041589736938, -0.00020347535610198975, -0.0001918002963066101, -0.00018012523651123047, -0.00016845017671585083, -0.0001567751169204712, -0.00014510005712509155, -0.00013342499732971191, -0.00012174993753433228, -0.00011007487773895264, -9.8399817943573e-05, -8.672475814819336e-05, -7.504969835281372e-05, -6.337463855743408e-05, -5.169957876205444e-05, -4.0024518966674805e-05, -2.8349459171295166e-05, -1.6674399375915527e-05, -4.999339580535889e-06, 6.67572021484375e-06, 1.835078001022339e-05, 3.0025839805603027e-05, 4.1700899600982666e-05, 5.3375959396362305e-05, 6.505101919174194e-05, 7.672607898712158e-05, 8.840113878250122e-05, 0.00010007619857788086, 0.0001117512583732605, 0.00012342631816864014, 0.00013510137796401978, 0.00014677643775939941, 0.00015845149755477905, 0.0001701265573501587, 0.00018180161714553833, 0.00019347667694091797, 0.0002051517367362976, 0.00021682679653167725, 0.00022850185632705688, 0.00024017691612243652, 0.00025185197591781616, 0.0002635270357131958, 0.00027520209550857544, 0.0002868771553039551, 0.0002985522150993347, 0.00031022727489471436, 0.000321902334690094, 0.00033357739448547363, 0.00034525245428085327, 0.0003569275140762329, 0.00036860257387161255, 0.0003802776336669922]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 0.0, 1.0, 5.0, 4.0, 6.0, 9.0, 12.0, 12.0, 14.0, 11.0, 18.0, 23.0, 25.0, 28.0, 29.0, 36.0, 27.0, 44.0, 43.0, 39.0, 48.0, 46.0, 45.0, 51.0, 42.0, 49.0, 39.0, 45.0, 28.0, 35.0, 33.0, 27.0, 25.0, 18.0, 17.0, 10.0, 8.0, 8.0, 5.0, 8.0, 7.0, 9.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.611513137817383e-05, -7.353536784648895e-05, -7.095560431480408e-05, -6.83758407831192e-05, -6.579607725143433e-05, -6.321631371974945e-05, -6.0636550188064575e-05, -5.80567866563797e-05, -5.5477023124694824e-05, -5.289725959300995e-05, -5.031749606132507e-05, -4.77377325296402e-05, -4.515796899795532e-05, -4.257820546627045e-05, -3.999844193458557e-05, -3.7418678402900696e-05, -3.483891487121582e-05, -3.2259151339530945e-05, -2.967938780784607e-05, -2.7099624276161194e-05, -2.451986074447632e-05, -2.1940097212791443e-05, -1.9360333681106567e-05, -1.6780570149421692e-05, -1.4200806617736816e-05, -1.1621043086051941e-05, -9.041279554367065e-06, -6.46151602268219e-06, -3.8817524909973145e-06, -1.301988959312439e-06, 1.2777745723724365e-06, 3.857538104057312e-06, 6.4373016357421875e-06, 9.017065167427063e-06, 1.1596828699111938e-05, 1.4176592230796814e-05, 1.675635576248169e-05, 1.9336119294166565e-05, 2.191588282585144e-05, 2.4495646357536316e-05, 2.707540988922119e-05, 2.9655173420906067e-05, 3.223493695259094e-05, 3.481470048427582e-05, 3.739446401596069e-05, 3.997422754764557e-05, 4.2553991079330444e-05, 4.513375461101532e-05, 4.7713518142700195e-05, 5.029328167438507e-05, 5.2873045206069946e-05, 5.545280873775482e-05, 5.80325722694397e-05, 6.061233580112457e-05, 6.319209933280945e-05, 6.577186286449432e-05, 6.83516263961792e-05, 7.093138992786407e-05, 7.351115345954895e-05, 7.609091699123383e-05, 7.86706805229187e-05, 8.125044405460358e-05, 8.383020758628845e-05, 8.640997111797333e-05, 8.89897346496582e-05]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 17.0, 9.0, 20.0, 19.0, 26.0, 35.0, 42.0, 56.0, 86.0, 93.0, 117.0, 108.0, 97.0, 57.0, 57.0, 37.0, 27.0, 21.0, 12.0, 12.0, 10.0, 9.0, 12.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006089828442782164, -0.005891638342291117, -0.00569344824180007, -0.005495258141309023, -0.005297068040817976, -0.005098877940326929, -0.004900687374174595, -0.004702497273683548, -0.004504307173192501, -0.004306117072701454, -0.004107926972210407, -0.00390973687171936, -0.0037115467712283134, -0.0035133566707372665, -0.003315166337415576, -0.003116976236924529, -0.002918786369264126, -0.002720596268773079, -0.002522406168282032, -0.002324216067790985, -0.002126025967299938, -0.0019278357503935695, -0.0017296455334872007, -0.0015314554329961538, -0.001333265332505107, -0.00113507523201406, -0.0009368850733153522, -0.0007386949146166444, -0.0005405048141255975, -0.00034231471363455057, -0.00014412449672818184, 5.4065603762865067e-05, 0.0002522561699151993, 0.00045044629951007664, 0.000648636429104954, 0.0008468265878036618, 0.0010450166882947087, 0.0012432067887857556, 0.0014413970056921244, 0.0016395871061831713, 0.0018377772066742182, 0.002035967307165265, 0.002234157407656312, 0.0024323477409780025, 0.0026305378414690495, 0.0028287279419600964, 0.0030269180424511433, 0.00322510814294219, 0.003423298243433237, 0.003621488343924284, 0.003819678444415331, 0.004017868544906378, 0.004216058645397425, 0.004414248745888472, 0.004612439312040806, 0.004810629412531853, 0.0050088195130229, 0.0052070096135139465, 0.0054051997140049934, 0.00560338981449604, 0.005801579914987087, 0.005999770015478134, 0.006197960115969181, 0.006396150216460228, 0.006594340316951275]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 9.0, 5.0, 8.0, 7.0, 4.0, 14.0, 13.0, 23.0, 13.0, 21.0, 26.0, 35.0, 28.0, 35.0, 43.0, 42.0, 49.0, 45.0, 47.0, 46.0, 52.0, 46.0, 34.0, 42.0, 35.0, 37.0, 41.0, 31.0, 23.0, 23.0, 21.0, 17.0, 27.0, 19.0, 9.0, 4.0, 6.0, 7.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0044693537056446075, -0.004333192016929388, -0.004197030793875456, -0.004060869105160236, -0.003924707882106304, -0.0037885461933910847, -0.003652384504675865, -0.0035162230487912893, -0.0033800615929067135, -0.0032439001370221376, -0.003107738681137562, -0.0029715769924223423, -0.0028354155365377665, -0.0026992540806531906, -0.002563092391937971, -0.0024269309360533953, -0.0022907694801688194, -0.0021546080242842436, -0.0020184465683996677, -0.0018822848796844482, -0.0017461234237998724, -0.0016099619679152966, -0.0014738003956153989, -0.0013376388233155012, -0.0012014773674309254, -0.0010653159115463495, -0.0009291543392464519, -0.0007929928251542151, -0.0006568313110619783, -0.0005206697969697416, -0.0003845082828775048, -0.00024834676878526807, -0.000112184789031744, 2.3976725060492754e-05, 0.0001601382391527295, 0.00029629975324496627, 0.000432461267337203, 0.0005686227814294398, 0.0007047842955216765, 0.0008409458096139133, 0.00097710732370615, 0.001113268779590726, 0.0012494303518906236, 0.0013855919241905212, 0.001521753380075097, 0.001657914835959673, 0.0017940764082595706, 0.0019302379805594683, 0.002066399436444044, 0.00220256089232862, 0.002338722348213196, 0.0024748840369284153, 0.002611045492812991, 0.002747206948697567, 0.0028833686374127865, 0.0030195300932973623, 0.003155691549181938, 0.003291853005066514, 0.00342801446095109, 0.0035641761496663094, 0.003700337605550885, 0.003836499061435461, 0.0039726607501506805, 0.004108821973204613, 0.004244983661919832]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 8.0, 18.0, 17.0, 37.0, 47.0, 76.0, 99.0, 135.0, 207.0, 278.0, 389.0, 667.0, 916.0, 1424.0, 2099.0, 3157.0, 4815.0, 7616.0, 12024.0, 19887.0, 33430.0, 58613.0, 113061.0, 242504.0, 264573.0, 125478.0, 63437.0, 35674.0, 21223.0, 13024.0, 8289.0, 5176.0, 3356.0, 2272.0, 1467.0, 970.0, 643.0, 436.0, 290.0, 221.0, 167.0, 110.0, 49.0, 49.0, 37.0, 29.0, 14.0, 17.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.008148193359375, -0.007885932922363281, -0.0076236724853515625, -0.007361412048339844, -0.007099151611328125, -0.006836891174316406, -0.0065746307373046875, -0.006312370300292969, -0.00605010986328125, -0.005787849426269531, -0.0055255889892578125, -0.005263328552246094, -0.005001068115234375, -0.004738807678222656, -0.0044765472412109375, -0.004214286804199219, -0.0039520263671875, -0.0036897659301757812, -0.0034275054931640625, -0.0031652450561523438, -0.002902984619140625, -0.0026407241821289062, -0.0023784637451171875, -0.0021162033081054688, -0.00185394287109375, -0.0015916824340820312, -0.0013294219970703125, -0.0010671615600585938, -0.000804901123046875, -0.0005426406860351562, -0.0002803802490234375, -1.811981201171875e-05, 0.000244140625, 0.0005064010620117188, 0.0007686614990234375, 0.0010309219360351562, 0.001293182373046875, 0.0015554428100585938, 0.0018177032470703125, 0.0020799636840820312, 0.00234222412109375, 0.0026044845581054688, 0.0028667449951171875, 0.0031290054321289062, 0.003391265869140625, 0.0036535263061523438, 0.0039157867431640625, 0.004178047180175781, 0.0044403076171875, 0.004702568054199219, 0.0049648284912109375, 0.005227088928222656, 0.005489349365234375, 0.005751609802246094, 0.0060138702392578125, 0.006276130676269531, 0.00653839111328125, 0.006800651550292969, 0.0070629119873046875, 0.007325172424316406, 0.007587432861328125, 0.007849693298339844, 0.008111953735351562, 0.008374214172363281, 0.008636474609375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 4.0, 7.0, 4.0, 6.0, 13.0, 20.0, 14.0, 16.0, 30.0, 16.0, 37.0, 31.0, 45.0, 47.0, 46.0, 51.0, 31.0, 55.0, 49.0, 48.0, 52.0, 47.0, 39.0, 47.0, 31.0, 24.0, 35.0, 28.0, 18.0, 19.0, 13.0, 25.0, 11.0, 6.0, 10.0, 8.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0041351318359375, -0.004007816314697266, -0.0038805007934570312, -0.003753185272216797, -0.0036258697509765625, -0.003498554229736328, -0.0033712387084960938, -0.0032439231872558594, -0.003116607666015625, -0.0029892921447753906, -0.0028619766235351562, -0.002734661102294922, -0.0026073455810546875, -0.002480030059814453, -0.0023527145385742188, -0.0022253990173339844, -0.00209808349609375, -0.0019707679748535156, -0.0018434524536132812, -0.0017161369323730469, -0.0015888214111328125, -0.0014615058898925781, -0.0013341903686523438, -0.0012068748474121094, -0.001079559326171875, -0.0009522438049316406, -0.0008249282836914062, -0.0006976127624511719, -0.0005702972412109375, -0.0004429817199707031, -0.00031566619873046875, -0.00018835067749023438, -6.103515625e-05, 6.628036499023438e-05, 0.00019359588623046875, 0.0003209114074707031, 0.0004482269287109375, 0.0005755424499511719, 0.0007028579711914062, 0.0008301734924316406, 0.000957489013671875, 0.0010848045349121094, 0.0012121200561523438, 0.0013394355773925781, 0.0014667510986328125, 0.0015940666198730469, 0.0017213821411132812, 0.0018486976623535156, 0.00197601318359375, 0.0021033287048339844, 0.0022306442260742188, 0.002357959747314453, 0.0024852752685546875, 0.002612590789794922, 0.0027399063110351562, 0.0028672218322753906, 0.002994537353515625, 0.0031218528747558594, 0.0032491683959960938, 0.003376483917236328, 0.0035037994384765625, 0.003631114959716797, 0.0037584304809570312, 0.0038857460021972656, 0.0040130615234375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 12.0, 15.0, 13.0, 36.0, 35.0, 63.0, 73.0, 137.0, 181.0, 258.0, 346.0, 594.0, 817.0, 1290.0, 1871.0, 2857.0, 4517.0, 6954.0, 11130.0, 18551.0, 31337.0, 54968.0, 100980.0, 201471.0, 280422.0, 145996.0, 76101.0, 42815.0, 24785.0, 14835.0, 8965.0, 5566.0, 3519.0, 2330.0, 1538.0, 955.0, 654.0, 472.0, 311.0, 229.0, 163.0, 113.0, 67.0, 67.0, 44.0, 18.0, 36.0, 17.0, 6.0, 12.0, 5.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.0084686279296875, -0.008214116096496582, -0.007959604263305664, -0.007705092430114746, -0.007450580596923828, -0.00719606876373291, -0.006941556930541992, -0.006687045097351074, -0.006432533264160156, -0.006178021430969238, -0.00592350959777832, -0.005668997764587402, -0.005414485931396484, -0.005159974098205566, -0.0049054622650146484, -0.0046509504318237305, -0.0043964385986328125, -0.0041419267654418945, -0.0038874149322509766, -0.0036329030990600586, -0.0033783912658691406, -0.0031238794326782227, -0.0028693675994873047, -0.0026148557662963867, -0.0023603439331054688, -0.0021058320999145508, -0.0018513202667236328, -0.0015968084335327148, -0.0013422966003417969, -0.001087784767150879, -0.0008332729339599609, -0.000578761100769043, -0.000324249267578125, -6.973743438720703e-05, 0.00018477439880371094, 0.0004392862319946289, 0.0006937980651855469, 0.0009483098983764648, 0.0012028217315673828, 0.0014573335647583008, 0.0017118453979492188, 0.0019663572311401367, 0.0022208690643310547, 0.0024753808975219727, 0.0027298927307128906, 0.0029844045639038086, 0.0032389163970947266, 0.0034934282302856445, 0.0037479400634765625, 0.0040024518966674805, 0.0042569637298583984, 0.004511475563049316, 0.004765987396240234, 0.005020499229431152, 0.00527501106262207, 0.005529522895812988, 0.005784034729003906, 0.006038546562194824, 0.006293058395385742, 0.00654757022857666, 0.006802082061767578, 0.007056593894958496, 0.007311105728149414, 0.007565617561340332, 0.00782012939453125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 3.0, 10.0, 3.0, 6.0, 6.0, 8.0, 18.0, 11.0, 12.0, 18.0, 19.0, 29.0, 27.0, 34.0, 24.0, 32.0, 41.0, 32.0, 43.0, 44.0, 35.0, 40.0, 45.0, 53.0, 31.0, 28.0, 41.0, 47.0, 33.0, 30.0, 32.0, 18.0, 34.0, 21.0, 16.0, 13.0, 14.0, 7.0, 10.0, 5.0, 7.0, 7.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0021533966064453125, -0.0020817220211029053, -0.002010047435760498, -0.0019383728504180908, -0.0018666982650756836, -0.0017950236797332764, -0.0017233490943908691, -0.001651674509048462, -0.0015799999237060547, -0.0015083253383636475, -0.0014366507530212402, -0.001364976167678833, -0.0012933015823364258, -0.0012216269969940186, -0.0011499524116516113, -0.001078277826309204, -0.0010066032409667969, -0.0009349286556243896, -0.0008632540702819824, -0.0007915794849395752, -0.000719904899597168, -0.0006482303142547607, -0.0005765557289123535, -0.0005048811435699463, -0.00043320655822753906, -0.00036153197288513184, -0.0002898573875427246, -0.00021818280220031738, -0.00014650821685791016, -7.483363151550293e-05, -3.159046173095703e-06, 6.851553916931152e-05, 0.00014019012451171875, 0.00021186470985412598, 0.0002835392951965332, 0.00035521388053894043, 0.00042688846588134766, 0.0004985630512237549, 0.0005702376365661621, 0.0006419122219085693, 0.0007135868072509766, 0.0007852613925933838, 0.000856935977935791, 0.0009286105632781982, 0.0010002851486206055, 0.0010719597339630127, 0.00114363431930542, 0.0012153089046478271, 0.0012869834899902344, 0.0013586580753326416, 0.0014303326606750488, 0.001502007246017456, 0.0015736818313598633, 0.0016453564167022705, 0.0017170310020446777, 0.001788705587387085, 0.0018603801727294922, 0.0019320547580718994, 0.0020037293434143066, 0.002075403928756714, 0.002147078514099121, 0.0022187530994415283, 0.0022904276847839355, 0.0023621022701263428, 0.00243377685546875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 8.0, 9.0, 28.0, 20.0, 38.0, 40.0, 76.0, 89.0, 122.0, 157.0, 213.0, 332.0, 479.0, 757.0, 1171.0, 1787.0, 3053.0, 5266.0, 9889.0, 20627.0, 51521.0, 176896.0, 583945.0, 117283.0, 38387.0, 16344.0, 8173.0, 4509.0, 2635.0, 1623.0, 954.0, 665.0, 448.0, 295.0, 178.0, 158.0, 130.0, 75.0, 37.0, 34.0, 23.0, 22.0, 20.0, 13.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003173351287841797, -0.0003065243363380432, -0.00029571354389190674, -0.00028490275144577026, -0.0002740919589996338, -0.0002632811665534973, -0.00025247037410736084, -0.00024165958166122437, -0.0002308487892150879, -0.00022003799676895142, -0.00020922720432281494, -0.00019841641187667847, -0.000187605619430542, -0.00017679482698440552, -0.00016598403453826904, -0.00015517324209213257, -0.0001443624496459961, -0.00013355165719985962, -0.00012274086475372314, -0.00011193007230758667, -0.0001011192798614502, -9.030848741531372e-05, -7.949769496917725e-05, -6.868690252304077e-05, -5.78761100769043e-05, -4.706531763076782e-05, -3.625452518463135e-05, -2.5443732738494873e-05, -1.4632940292358398e-05, -3.822147846221924e-06, 6.988644599914551e-06, 1.7799437046051025e-05, 2.86102294921875e-05, 3.9421021938323975e-05, 5.023181438446045e-05, 6.104260683059692e-05, 7.18533992767334e-05, 8.266419172286987e-05, 9.347498416900635e-05, 0.00010428577661514282, 0.0001150965690612793, 0.00012590736150741577, 0.00013671815395355225, 0.00014752894639968872, 0.0001583397388458252, 0.00016915053129196167, 0.00017996132373809814, 0.00019077211618423462, 0.0002015829086303711, 0.00021239370107650757, 0.00022320449352264404, 0.00023401528596878052, 0.000244826078414917, 0.00025563687086105347, 0.00026644766330718994, 0.0002772584557533264, 0.0002880692481994629, 0.00029888004064559937, 0.00030969083309173584, 0.0003205016255378723, 0.0003313124179840088, 0.00034212321043014526, 0.00035293400287628174, 0.0003637447953224182, 0.0003745555877685547]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 66.0, 0.0, 0.0, 108.0, 0.0, 0.0, 0.0, 140.0, 0.0, 0.0, 0.0, 230.0, 0.0, 0.0, 152.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 59.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-5.364418029785156e-07, -5.19677996635437e-07, -5.029141902923584e-07, -4.861503839492798e-07, -4.6938657760620117e-07, -4.5262277126312256e-07, -4.3585896492004395e-07, -4.1909515857696533e-07, -4.023313522338867e-07, -3.855675458908081e-07, -3.688037395477295e-07, -3.520399332046509e-07, -3.3527612686157227e-07, -3.1851232051849365e-07, -3.0174851417541504e-07, -2.849847078323364e-07, -2.682209014892578e-07, -2.514570951461792e-07, -2.3469328880310059e-07, -2.1792948246002197e-07, -2.0116567611694336e-07, -1.8440186977386475e-07, -1.6763806343078613e-07, -1.5087425708770752e-07, -1.341104507446289e-07, -1.1734664440155029e-07, -1.0058283805847168e-07, -8.381903171539307e-08, -6.705522537231445e-08, -5.029141902923584e-08, -3.3527612686157227e-08, -1.6763806343078613e-08, 0.0, 1.6763806343078613e-08, 3.3527612686157227e-08, 5.029141902923584e-08, 6.705522537231445e-08, 8.381903171539307e-08, 1.0058283805847168e-07, 1.1734664440155029e-07, 1.341104507446289e-07, 1.5087425708770752e-07, 1.6763806343078613e-07, 1.8440186977386475e-07, 2.0116567611694336e-07, 2.1792948246002197e-07, 2.3469328880310059e-07, 2.514570951461792e-07, 2.682209014892578e-07, 2.849847078323364e-07, 3.0174851417541504e-07, 3.1851232051849365e-07, 3.3527612686157227e-07, 3.520399332046509e-07, 3.688037395477295e-07, 3.855675458908081e-07, 4.023313522338867e-07, 4.1909515857696533e-07, 4.3585896492004395e-07, 4.5262277126312256e-07, 4.6938657760620117e-07, 4.861503839492798e-07, 5.029141902923584e-07, 5.19677996635437e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 5.0, 7.0, 11.0, 22.0, 25.0, 19.0, 27.0, 49.0, 51.0, 93.0, 119.0, 159.0, 207.0, 275.0, 346.0, 454.0, 593.0, 790.0, 1076.0, 1379.0, 1924.0, 2627.0, 4123.0, 6780.0, 12435.0, 26402.0, 67327.0, 219718.0, 510054.0, 109691.0, 39207.0, 16989.0, 8679.0, 5064.0, 3240.0, 2200.0, 1511.0, 1173.0, 899.0, 622.0, 547.0, 389.0, 340.0, 220.0, 181.0, 132.0, 95.0, 79.0, 59.0, 46.0, 23.0, 29.0, 18.0, 11.0, 10.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.0002677440643310547, -0.00025916844606399536, -0.00025059282779693604, -0.0002420172095298767, -0.00023344159126281738, -0.00022486597299575806, -0.00021629035472869873, -0.0002077147364616394, -0.00019913911819458008, -0.00019056349992752075, -0.00018198788166046143, -0.0001734122633934021, -0.00016483664512634277, -0.00015626102685928345, -0.00014768540859222412, -0.0001391097903251648, -0.00013053417205810547, -0.00012195855379104614, -0.00011338293552398682, -0.00010480731725692749, -9.623169898986816e-05, -8.765608072280884e-05, -7.908046245574951e-05, -7.050484418869019e-05, -6.192922592163086e-05, -5.335360765457153e-05, -4.477798938751221e-05, -3.620237112045288e-05, -2.7626752853393555e-05, -1.905113458633423e-05, -1.0475516319274902e-05, -1.8998980522155762e-06, 6.67572021484375e-06, 1.5251338481903076e-05, 2.3826956748962402e-05, 3.240257501602173e-05, 4.0978193283081055e-05, 4.955381155014038e-05, 5.812942981719971e-05, 6.670504808425903e-05, 7.528066635131836e-05, 8.385628461837769e-05, 9.243190288543701e-05, 0.00010100752115249634, 0.00010958313941955566, 0.00011815875768661499, 0.00012673437595367432, 0.00013530999422073364, 0.00014388561248779297, 0.0001524612307548523, 0.00016103684902191162, 0.00016961246728897095, 0.00017818808555603027, 0.0001867637038230896, 0.00019533932209014893, 0.00020391494035720825, 0.00021249055862426758, 0.0002210661768913269, 0.00022964179515838623, 0.00023821741342544556, 0.0002467930316925049, 0.0002553686499595642, 0.00026394426822662354, 0.00027251988649368286, 0.0002810955047607422]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 11.0, 6.0, 9.0, 7.0, 11.0, 24.0, 44.0, 69.0, 81.0, 119.0, 266.0, 104.0, 73.0, 56.0, 34.0, 31.0, 17.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00011038780212402344, -0.00010707974433898926, -0.00010377168655395508, -0.0001004636287689209, -9.715557098388672e-05, -9.384751319885254e-05, -9.053945541381836e-05, -8.723139762878418e-05, -8.392333984375e-05, -8.061528205871582e-05, -7.730722427368164e-05, -7.399916648864746e-05, -7.069110870361328e-05, -6.73830509185791e-05, -6.407499313354492e-05, -6.076693534851074e-05, -5.745887756347656e-05, -5.415081977844238e-05, -5.08427619934082e-05, -4.7534704208374023e-05, -4.4226646423339844e-05, -4.0918588638305664e-05, -3.7610530853271484e-05, -3.4302473068237305e-05, -3.0994415283203125e-05, -2.7686357498168945e-05, -2.4378299713134766e-05, -2.1070241928100586e-05, -1.7762184143066406e-05, -1.4454126358032227e-05, -1.1146068572998047e-05, -7.838010787963867e-06, -4.5299530029296875e-06, -1.2218952178955078e-06, 2.086162567138672e-06, 5.3942203521728516e-06, 8.702278137207031e-06, 1.2010335922241211e-05, 1.531839370727539e-05, 1.862645149230957e-05, 2.193450927734375e-05, 2.524256706237793e-05, 2.855062484741211e-05, 3.185868263244629e-05, 3.516674041748047e-05, 3.847479820251465e-05, 4.178285598754883e-05, 4.509091377258301e-05, 4.839897155761719e-05, 5.170702934265137e-05, 5.501508712768555e-05, 5.8323144912719727e-05, 6.16312026977539e-05, 6.493926048278809e-05, 6.824731826782227e-05, 7.155537605285645e-05, 7.486343383789062e-05, 7.81714916229248e-05, 8.147954940795898e-05, 8.478760719299316e-05, 8.809566497802734e-05, 9.140372276306152e-05, 9.47117805480957e-05, 9.801983833312988e-05, 0.00010132789611816406]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 10.0, 4.0, 7.0, 3.0, 9.0, 12.0, 24.0, 29.0, 22.0, 40.0, 45.0, 51.0, 67.0, 80.0, 97.0, 84.0, 79.0, 73.0, 53.0, 48.0, 19.0, 29.0, 26.0, 17.0, 13.0, 14.0, 9.0, 7.0, 11.0, 4.0, 4.0, 4.0, 2.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004386004991829395, -0.0042350622825324535, -0.004084119573235512, -0.00393317686393857, -0.0037822341546416283, -0.0036312914453446865, -0.0034803487360477448, -0.003329406026750803, -0.0031784633174538612, -0.0030275206081569195, -0.0028765778988599777, -0.002725635189563036, -0.002574692480266094, -0.0024237497709691525, -0.0022728070616722107, -0.002121864352375269, -0.001970921643078327, -0.0018199789337813854, -0.0016690362244844437, -0.001518093515187502, -0.0013671508058905602, -0.0012162080965936184, -0.0010652653872966766, -0.0009143226779997349, -0.0007633799687027931, -0.0006124372594058514, -0.0004614945501089096, -0.00031055184081196785, -0.0001596091315150261, -8.666422218084335e-06, 0.00014227628707885742, 0.0002932189963757992, 0.00044416217133402824, 0.00059510488063097, 0.0007460475899279118, 0.0008969902992248535, 0.0010479330085217953, 0.001198875717818737, 0.0013498184271156788, 0.0015007611364126205, 0.0016517038457095623, 0.001802646555006504, 0.001953589264303446, 0.0021045319736003876, 0.0022554746828973293, 0.002406417392194271, 0.002557360101491213, 0.0027083028107881546, 0.0028592455200850964, 0.003010188229382038, 0.00316113093867898, 0.0033120736479759216, 0.0034630163572728634, 0.003613959066569805, 0.003764901775866747, 0.003915844485163689, 0.00406678719446063, 0.004217729903757572, 0.004368672613054514, 0.004519615322351456, 0.0046705580316483974, 0.004821500740945339, 0.004972443450242281, 0.005123386159539223, 0.0052743288688361645]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 7.0, 5.0, 5.0, 9.0, 7.0, 16.0, 11.0, 21.0, 17.0, 18.0, 24.0, 24.0, 31.0, 33.0, 35.0, 46.0, 42.0, 38.0, 47.0, 44.0, 42.0, 45.0, 38.0, 40.0, 42.0, 31.0, 32.0, 37.0, 31.0, 33.0, 25.0, 26.0, 14.0, 10.0, 15.0, 11.0, 10.0, 5.0, 11.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0035886052064597607, -0.0034701700787991285, -0.0033517349511384964, -0.003233300056308508, -0.003114864928647876, -0.0029964298009872437, -0.0028779946733266115, -0.0027595595456659794, -0.002641124650835991, -0.0025226895231753588, -0.0024042543955147266, -0.002285819500684738, -0.002167384373024106, -0.002048949245363474, -0.0019305141177028418, -0.0018120789900422096, -0.0016936438623815775, -0.0015752087347209454, -0.001456773723475635, -0.001338338595815003, -0.0012199035845696926, -0.0011014684569090605, -0.0009830333292484283, -0.0008645982597954571, -0.0007461631903424859, -0.0006277281208895147, -0.0005092930514365435, -0.00039085792377591133, -0.0002724228543229401, -0.0001539877848699689, -3.555265720933676e-05, 8.288241224363446e-05, 0.00020131748169660568, 0.0003197525511495769, 0.0004381876497063786, 0.0005566227482631803, 0.0006750578177161515, 0.0007934928871691227, 0.0009119280148297548, 0.001030363142490387, 0.0011487981537356973, 0.0012672332813963294, 0.0013856682926416397, 0.0015041034203022718, 0.001622538547962904, 0.0017409735592082143, 0.0018594086868688464, 0.0019778436981141567, 0.002096278825774789, 0.002214713953435421, 0.002333149081096053, 0.0024515842087566853, 0.0025700191035866737, 0.002688454231247306, 0.002806889358907938, 0.00292532448656857, 0.0030437596142292023, 0.0031621947418898344, 0.0032806298695504665, 0.003399064764380455, 0.003517499892041087, 0.0036359350197017193, 0.0037543701473623514, 0.0038728052750229836, 0.003991240169852972]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 11.0, 15.0, 21.0, 31.0, 37.0, 51.0, 81.0, 125.0, 152.0, 216.0, 328.0, 487.0, 613.0, 997.0, 1334.0, 2044.0, 3129.0, 4624.0, 7333.0, 11746.0, 19646.0, 34306.0, 66826.0, 166001.0, 773855.0, 2232939.0, 582862.0, 148359.0, 60718.0, 30958.0, 17512.0, 9994.0, 6128.0, 3865.0, 2419.0, 1556.0, 938.0, 679.0, 412.0, 292.0, 194.0, 136.0, 75.0, 86.0, 48.0, 39.0, 14.0, 13.0, 14.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.0073699951171875, -0.0071353912353515625, -0.006900787353515625, -0.0066661834716796875, -0.00643157958984375, -0.0061969757080078125, -0.005962371826171875, -0.0057277679443359375, -0.0054931640625, -0.0052585601806640625, -0.005023956298828125, -0.0047893524169921875, -0.00455474853515625, -0.0043201446533203125, -0.004085540771484375, -0.0038509368896484375, -0.0036163330078125, -0.0033817291259765625, -0.003147125244140625, -0.0029125213623046875, -0.00267791748046875, -0.0024433135986328125, -0.002208709716796875, -0.0019741058349609375, -0.001739501953125, -0.0015048980712890625, -0.001270294189453125, -0.0010356903076171875, -0.00080108642578125, -0.0005664825439453125, -0.000331878662109375, -9.72747802734375e-05, 0.0001373291015625, 0.0003719329833984375, 0.000606536865234375, 0.0008411407470703125, 0.00107574462890625, 0.0013103485107421875, 0.001544952392578125, 0.0017795562744140625, 0.00201416015625, 0.0022487640380859375, 0.002483367919921875, 0.0027179718017578125, 0.00295257568359375, 0.0031871795654296875, 0.003421783447265625, 0.0036563873291015625, 0.0038909912109375, 0.0041255950927734375, 0.004360198974609375, 0.0045948028564453125, 0.00482940673828125, 0.0050640106201171875, 0.005298614501953125, 0.0055332183837890625, 0.005767822265625, 0.0060024261474609375, 0.006237030029296875, 0.0064716339111328125, 0.00670623779296875, 0.0069408416748046875, 0.007175445556640625, 0.0074100494384765625, 0.0076446533203125]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 1.0, 4.0, 2.0, 7.0, 9.0, 6.0, 12.0, 13.0, 17.0, 22.0, 22.0, 29.0, 25.0, 20.0, 35.0, 44.0, 55.0, 46.0, 51.0, 44.0, 51.0, 51.0, 50.0, 39.0, 56.0, 40.0, 28.0, 30.0, 39.0, 29.0, 20.0, 18.0, 19.0, 11.0, 15.0, 7.0, 5.0, 8.0, 3.0, 7.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003139495849609375, -0.0030365288257598877, -0.0029335618019104004, -0.002830594778060913, -0.0027276277542114258, -0.0026246607303619385, -0.002521693706512451, -0.002418726682662964, -0.0023157596588134766, -0.0022127926349639893, -0.002109825611114502, -0.0020068585872650146, -0.0019038915634155273, -0.00180092453956604, -0.0016979575157165527, -0.0015949904918670654, -0.0014920234680175781, -0.0013890564441680908, -0.0012860894203186035, -0.0011831223964691162, -0.001080155372619629, -0.0009771883487701416, -0.0008742213249206543, -0.000771254301071167, -0.0006682872772216797, -0.0005653202533721924, -0.0004623532295227051, -0.0003593862056732178, -0.00025641918182373047, -0.00015345215797424316, -5.048513412475586e-05, 5.2481889724731445e-05, 0.00015544891357421875, 0.00025841593742370605, 0.00036138296127319336, 0.00046434998512268066, 0.000567317008972168, 0.0006702840328216553, 0.0007732510566711426, 0.0008762180805206299, 0.0009791851043701172, 0.0010821521282196045, 0.0011851191520690918, 0.001288086175918579, 0.0013910531997680664, 0.0014940202236175537, 0.001596987247467041, 0.0016999542713165283, 0.0018029212951660156, 0.001905888319015503, 0.0020088553428649902, 0.0021118223667144775, 0.002214789390563965, 0.002317756414413452, 0.0024207234382629395, 0.0025236904621124268, 0.002626657485961914, 0.0027296245098114014, 0.0028325915336608887, 0.002935558557510376, 0.0030385255813598633, 0.0031414926052093506, 0.003244459629058838, 0.003347426652908325, 0.0034503936767578125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 7.0, 15.0, 24.0, 33.0, 36.0, 62.0, 67.0, 128.0, 184.0, 283.0, 428.0, 631.0, 930.0, 1414.0, 2234.0, 3502.0, 5593.0, 9146.0, 15165.0, 26096.0, 47847.0, 91674.0, 202698.0, 617845.0, 2092931.0, 655708.0, 208856.0, 94616.0, 48717.0, 26640.0, 15671.0, 9144.0, 5579.0, 3627.0, 2280.0, 1463.0, 951.0, 686.0, 427.0, 317.0, 195.0, 125.0, 106.0, 64.0, 42.0, 35.0, 24.0, 10.0, 12.0, 2.0, 5.0, 0.0, 3.0, 1.0], "bins": [-0.007030487060546875, -0.006826817989349365, -0.0066231489181518555, -0.006419479846954346, -0.006215810775756836, -0.006012141704559326, -0.005808472633361816, -0.005604803562164307, -0.005401134490966797, -0.005197465419769287, -0.004993796348571777, -0.004790127277374268, -0.004586458206176758, -0.004382789134979248, -0.004179120063781738, -0.0039754509925842285, -0.0037717819213867188, -0.003568112850189209, -0.0033644437789916992, -0.0031607747077941895, -0.0029571056365966797, -0.00275343656539917, -0.00254976749420166, -0.0023460984230041504, -0.0021424293518066406, -0.0019387602806091309, -0.001735091209411621, -0.0015314221382141113, -0.0013277530670166016, -0.0011240839958190918, -0.000920414924621582, -0.0007167458534240723, -0.0005130767822265625, -0.00030940771102905273, -0.00010573863983154297, 9.79304313659668e-05, 0.00030159950256347656, 0.0005052685737609863, 0.0007089376449584961, 0.0009126067161560059, 0.0011162757873535156, 0.0013199448585510254, 0.0015236139297485352, 0.001727283000946045, 0.0019309520721435547, 0.0021346211433410645, 0.0023382902145385742, 0.002541959285736084, 0.0027456283569335938, 0.0029492974281311035, 0.0031529664993286133, 0.003356635570526123, 0.003560304641723633, 0.0037639737129211426, 0.003967642784118652, 0.004171311855316162, 0.004374980926513672, 0.004578649997711182, 0.004782319068908691, 0.004985988140106201, 0.005189657211303711, 0.005393326282501221, 0.0055969953536987305, 0.00580066442489624, 0.00600433349609375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 9.0, 8.0, 13.0, 20.0, 25.0, 24.0, 37.0, 44.0, 54.0, 66.0, 84.0, 98.0, 98.0, 136.0, 188.0, 195.0, 308.0, 435.0, 464.0, 414.0, 300.0, 231.0, 155.0, 133.0, 98.0, 77.0, 59.0, 62.0, 50.0, 32.0, 28.0, 22.0, 17.0, 13.0, 10.0, 10.0, 8.0, 9.0, 7.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016870498657226562, -0.0016295760869979858, -0.0015721023082733154, -0.001514628529548645, -0.0014571547508239746, -0.0013996809720993042, -0.0013422071933746338, -0.0012847334146499634, -0.001227259635925293, -0.0011697858572006226, -0.0011123120784759521, -0.0010548382997512817, -0.0009973645210266113, -0.0009398907423019409, -0.0008824169635772705, -0.0008249431848526001, -0.0007674694061279297, -0.0007099956274032593, -0.0006525218486785889, -0.0005950480699539185, -0.000537574291229248, -0.00048010051250457764, -0.0004226267337799072, -0.0003651529550552368, -0.0003076791763305664, -0.000250205397605896, -0.00019273161888122559, -0.00013525784015655518, -7.778406143188477e-05, -2.0310282707214355e-05, 3.7163496017456055e-05, 9.463727474212646e-05, 0.00015211105346679688, 0.00020958483219146729, 0.0002670586109161377, 0.0003245323896408081, 0.0003820061683654785, 0.0004394799470901489, 0.0004969537258148193, 0.0005544275045394897, 0.0006119012832641602, 0.0006693750619888306, 0.000726848840713501, 0.0007843226194381714, 0.0008417963981628418, 0.0008992701768875122, 0.0009567439556121826, 0.001014217734336853, 0.0010716915130615234, 0.0011291652917861938, 0.0011866390705108643, 0.0012441128492355347, 0.001301586627960205, 0.0013590604066848755, 0.001416534185409546, 0.0014740079641342163, 0.0015314817428588867, 0.0015889555215835571, 0.0016464293003082275, 0.001703903079032898, 0.0017613768577575684, 0.0018188506364822388, 0.0018763244152069092, 0.0019337981939315796, 0.00199127197265625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 5.0, 8.0, 17.0, 15.0, 13.0, 32.0, 38.0, 42.0, 59.0, 74.0, 85.0, 131.0, 92.0, 86.0, 69.0, 50.0, 25.0, 32.0, 17.0, 14.0, 14.0, 11.0, 20.0, 7.0, 8.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00569415045902133, -0.0055389367043972015, -0.005383722949773073, -0.005228509195148945, -0.005073294974863529, -0.004918081220239401, -0.0047628674656152725, -0.004607653710991144, -0.004452439956367016, -0.0042972262017428875, -0.004142012447118759, -0.0039867982268333435, -0.003831584705039859, -0.003676370717585087, -0.0035211569629609585, -0.00336594320833683, -0.003210729220882058, -0.00305551546625793, -0.002900301478803158, -0.0027450877241790295, -0.002589873969554901, -0.0024346602149307728, -0.002279446227476001, -0.0021242324728518724, -0.0019690184853971004, -0.0018138046143576503, -0.001658590859733522, -0.0015033769886940718, -0.0013481632340699434, -0.0011929493630304933, -0.001037735491991043, -0.0008825217373669147, -0.0007273079827427864, -0.0005720941699109972, -0.00041688032797537744, -0.00026166648603975773, -0.00010645267320796847, 4.876113962382078e-05, 0.00020397501066327095, 0.0003591887652873993, 0.0005144026363268495, 0.0006696164491586387, 0.000824830261990428, 0.0009800441330298781, 0.0011352580040693283, 0.0012904717586934566, 0.0014456856297329068, 0.0016008993843570352, 0.0017561132553964853, 0.0019113271264359355, 0.0020665409974753857, 0.002221754752099514, 0.0023769685067236423, 0.0025321822613477707, 0.0026873962488025427, 0.002842610003426671, 0.002997823990881443, 0.0031530377455055714, 0.0033082517329603434, 0.0034634654875844717, 0.0036186792422086, 0.003773893229663372, 0.0039291069842875, 0.004084320738911629, 0.004239534493535757]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 6.0, 11.0, 8.0, 11.0, 12.0, 21.0, 21.0, 19.0, 28.0, 26.0, 52.0, 40.0, 40.0, 29.0, 62.0, 42.0, 45.0, 41.0, 32.0, 37.0, 46.0, 34.0, 54.0, 36.0, 34.0, 30.0, 26.0, 29.0, 16.0, 18.0, 16.0, 17.0, 14.0, 14.0, 6.0, 3.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.003845968283712864, -0.003727878211066127, -0.003609787905588746, -0.003491697832942009, -0.0033736075274646282, -0.003255517454817891, -0.003137427382171154, -0.0030193370766937733, -0.002901247004047036, -0.002783156931400299, -0.0026650666259229183, -0.0025469765532761812, -0.002428886480629444, -0.0023107961751520634, -0.0021927061025053263, -0.002074616029858589, -0.0019565257243812084, -0.0018384355353191495, -0.0017203453462570906, -0.0016022552736103535, -0.0014841650845482945, -0.0013660748954862356, -0.0012479848228394985, -0.0011298946337774396, -0.0010118044447153807, -0.0008937142556533217, -0.0007756241247989237, -0.0006575339939445257, -0.0005394438048824668, -0.00042135361582040787, -0.00030326348496600986, -0.00018517335411161184, -6.708339788019657e-05, 5.10067620780319e-05, 0.00016909692203626037, 0.00028718708199448884, 0.0004052772419527173, 0.0005233674310147762, 0.0006414575618691742, 0.0007595476927235723, 0.0008776378817856312, 0.00099572807084769, 0.001113818259909749, 0.0012319083325564861, 0.001349998521618545, 0.001468088710680604, 0.001586178783327341, 0.0017042689723894, 0.001822359161451459, 0.0019404493505135179, 0.0020585395395755768, 0.002176629612222314, 0.002294719684869051, 0.0024128099903464317, 0.002530900062993169, 0.002648990135639906, 0.0027670804411172867, 0.0028851705137640238, 0.0030032608192414045, 0.0031213508918881416, 0.0032394411973655224, 0.0033575312700122595, 0.0034756213426589966, 0.0035937116481363773, 0.0037118017207831144]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 13.0, 16.0, 7.0, 34.0, 40.0, 59.0, 87.0, 106.0, 159.0, 218.0, 357.0, 466.0, 839.0, 1310.0, 2010.0, 3163.0, 5078.0, 8017.0, 13408.0, 23001.0, 40069.0, 75185.0, 156259.0, 309868.0, 199590.0, 92996.0, 48129.0, 26742.0, 15596.0, 9487.0, 5902.0, 3664.0, 2279.0, 1489.0, 998.0, 591.0, 439.0, 298.0, 192.0, 122.0, 79.0, 73.0, 32.0, 28.0, 24.0, 8.0, 8.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0009775161743164062, -0.0009475797414779663, -0.0009176433086395264, -0.0008877068758010864, -0.0008577704429626465, -0.0008278340101242065, -0.0007978975772857666, -0.0007679611444473267, -0.0007380247116088867, -0.0007080882787704468, -0.0006781518459320068, -0.0006482154130935669, -0.000618278980255127, -0.000588342547416687, -0.0005584061145782471, -0.0005284696817398071, -0.0004985332489013672, -0.00046859681606292725, -0.0004386603832244873, -0.00040872395038604736, -0.0003787875175476074, -0.0003488510847091675, -0.00031891465187072754, -0.0002889782190322876, -0.00025904178619384766, -0.00022910535335540771, -0.00019916892051696777, -0.00016923248767852783, -0.0001392960548400879, -0.00010935962200164795, -7.942318916320801e-05, -4.9486756324768066e-05, -1.9550323486328125e-05, 1.0386109352111816e-05, 4.032254219055176e-05, 7.02589750289917e-05, 0.00010019540786743164, 0.00013013184070587158, 0.00016006827354431152, 0.00019000470638275146, 0.0002199411392211914, 0.00024987757205963135, 0.0002798140048980713, 0.00030975043773651123, 0.00033968687057495117, 0.0003696233034133911, 0.00039955973625183105, 0.000429496169090271, 0.00045943260192871094, 0.0004893690347671509, 0.0005193054676055908, 0.0005492419004440308, 0.0005791783332824707, 0.0006091147661209106, 0.0006390511989593506, 0.0006689876317977905, 0.0006989240646362305, 0.0007288604974746704, 0.0007587969303131104, 0.0007887333631515503, 0.0008186697959899902, 0.0008486062288284302, 0.0008785426616668701, 0.0009084790945053101, 0.00093841552734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 8.0, 6.0, 7.0, 12.0, 8.0, 14.0, 19.0, 14.0, 25.0, 25.0, 31.0, 33.0, 39.0, 42.0, 47.0, 52.0, 37.0, 70.0, 35.0, 43.0, 46.0, 40.0, 43.0, 46.0, 35.0, 38.0, 33.0, 24.0, 22.0, 15.0, 9.0, 23.0, 16.0, 14.0, 9.0, 7.0, 3.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00423431396484375, -0.004103899002075195, -0.003973484039306641, -0.003843069076538086, -0.0037126541137695312, -0.0035822391510009766, -0.003451824188232422, -0.003321409225463867, -0.0031909942626953125, -0.003060579299926758, -0.002930164337158203, -0.0027997493743896484, -0.0026693344116210938, -0.002538919448852539, -0.0024085044860839844, -0.0022780895233154297, -0.002147674560546875, -0.0020172595977783203, -0.0018868446350097656, -0.001756429672241211, -0.0016260147094726562, -0.0014955997467041016, -0.0013651847839355469, -0.0012347698211669922, -0.0011043548583984375, -0.0009739398956298828, -0.0008435249328613281, -0.0007131099700927734, -0.0005826950073242188, -0.00045228004455566406, -0.0003218650817871094, -0.0001914501190185547, -6.103515625e-05, 6.937980651855469e-05, 0.00019979476928710938, 0.00033020973205566406, 0.00046062469482421875, 0.0005910396575927734, 0.0007214546203613281, 0.0008518695831298828, 0.0009822845458984375, 0.0011126995086669922, 0.0012431144714355469, 0.0013735294342041016, 0.0015039443969726562, 0.001634359359741211, 0.0017647743225097656, 0.0018951892852783203, 0.002025604248046875, 0.0021560192108154297, 0.0022864341735839844, 0.002416849136352539, 0.0025472640991210938, 0.0026776790618896484, 0.002808094024658203, 0.002938508987426758, 0.0030689239501953125, 0.003199338912963867, 0.003329753875732422, 0.0034601688385009766, 0.0035905838012695312, 0.003720998764038086, 0.0038514137268066406, 0.003981828689575195, 0.00411224365234375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 9.0, 26.0, 22.0, 33.0, 74.0, 111.0, 160.0, 297.0, 548.0, 869.0, 1621.0, 2974.0, 5327.0, 10385.0, 20427.0, 45360.0, 115678.0, 394854.0, 287254.0, 89510.0, 36542.0, 17175.0, 8717.0, 4685.0, 2500.0, 1473.0, 788.0, 461.0, 257.0, 147.0, 95.0, 51.0, 35.0, 30.0, 18.0, 11.0, 8.0, 11.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0016078948974609375, -0.0015617907047271729, -0.0015156865119934082, -0.0014695823192596436, -0.001423478126525879, -0.0013773739337921143, -0.0013312697410583496, -0.001285165548324585, -0.0012390613555908203, -0.0011929571628570557, -0.001146852970123291, -0.0011007487773895264, -0.0010546445846557617, -0.001008540391921997, -0.0009624361991882324, -0.0009163320064544678, -0.0008702278137207031, -0.0008241236209869385, -0.0007780194282531738, -0.0007319152355194092, -0.0006858110427856445, -0.0006397068500518799, -0.0005936026573181152, -0.0005474984645843506, -0.0005013942718505859, -0.0004552900791168213, -0.00040918588638305664, -0.000363081693649292, -0.00031697750091552734, -0.0002708733081817627, -0.00022476911544799805, -0.0001786649227142334, -0.00013256072998046875, -8.64565372467041e-05, -4.035234451293945e-05, 5.751848220825195e-06, 5.1856040954589844e-05, 9.796023368835449e-05, 0.00014406442642211914, 0.0001901686191558838, 0.00023627281188964844, 0.0002823770046234131, 0.00032848119735717773, 0.0003745853900909424, 0.00042068958282470703, 0.0004667937755584717, 0.0005128979682922363, 0.000559002161026001, 0.0006051063537597656, 0.0006512105464935303, 0.0006973147392272949, 0.0007434189319610596, 0.0007895231246948242, 0.0008356273174285889, 0.0008817315101623535, 0.0009278357028961182, 0.0009739398956298828, 0.0010200440883636475, 0.0010661482810974121, 0.0011122524738311768, 0.0011583566665649414, 0.001204460859298706, 0.0012505650520324707, 0.0012966692447662354, 0.0013427734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 1.0, 8.0, 4.0, 10.0, 4.0, 11.0, 16.0, 21.0, 13.0, 17.0, 24.0, 21.0, 14.0, 22.0, 37.0, 23.0, 32.0, 27.0, 35.0, 40.0, 33.0, 26.0, 36.0, 36.0, 38.0, 33.0, 31.0, 33.0, 34.0, 28.0, 41.0, 30.0, 32.0, 19.0, 20.0, 27.0, 23.0, 22.0, 13.0, 5.0, 13.0, 13.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0], "bins": [-0.002132415771484375, -0.0020691007375717163, -0.0020057857036590576, -0.001942470669746399, -0.0018791556358337402, -0.0018158406019210815, -0.0017525255680084229, -0.0016892105340957642, -0.0016258955001831055, -0.0015625804662704468, -0.001499265432357788, -0.0014359503984451294, -0.0013726353645324707, -0.001309320330619812, -0.0012460052967071533, -0.0011826902627944946, -0.001119375228881836, -0.0010560601949691772, -0.0009927451610565186, -0.0009294301271438599, -0.0008661150932312012, -0.0008028000593185425, -0.0007394850254058838, -0.0006761699914932251, -0.0006128549575805664, -0.0005495399236679077, -0.000486224889755249, -0.00042290985584259033, -0.00035959482192993164, -0.00029627978801727295, -0.00023296475410461426, -0.00016964972019195557, -0.00010633468627929688, -4.3019652366638184e-05, 2.0295381546020508e-05, 8.36104154586792e-05, 0.0001469254493713379, 0.00021024048328399658, 0.0002735555171966553, 0.00033687055110931396, 0.00040018558502197266, 0.00046350061893463135, 0.00052681565284729, 0.0005901306867599487, 0.0006534457206726074, 0.0007167607545852661, 0.0007800757884979248, 0.0008433908224105835, 0.0009067058563232422, 0.0009700208902359009, 0.0010333359241485596, 0.0010966509580612183, 0.001159965991973877, 0.0012232810258865356, 0.0012865960597991943, 0.001349911093711853, 0.0014132261276245117, 0.0014765411615371704, 0.001539856195449829, 0.0016031712293624878, 0.0016664862632751465, 0.0017298012971878052, 0.0017931163311004639, 0.0018564313650131226, 0.0019197463989257812]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 3.0, 6.0, 5.0, 5.0, 6.0, 9.0, 16.0, 24.0, 36.0, 58.0, 73.0, 105.0, 149.0, 263.0, 481.0, 775.0, 1362.0, 2263.0, 4358.0, 7940.0, 16706.0, 39964.0, 136002.0, 636576.0, 128188.0, 39055.0, 16198.0, 8127.0, 4243.0, 2250.0, 1282.0, 777.0, 459.0, 276.0, 167.0, 126.0, 74.0, 57.0, 48.0, 16.0, 10.0, 6.0, 1.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.96453857421875e-05, -8.626095950603485e-05, -8.28765332698822e-05, -7.949210703372955e-05, -7.61076807975769e-05, -7.272325456142426e-05, -6.93388283252716e-05, -6.595440208911896e-05, -6.256997585296631e-05, -5.918554961681366e-05, -5.580112338066101e-05, -5.241669714450836e-05, -4.903227090835571e-05, -4.5647844672203064e-05, -4.2263418436050415e-05, -3.8878992199897766e-05, -3.549456596374512e-05, -3.211013972759247e-05, -2.872571349143982e-05, -2.534128725528717e-05, -2.195686101913452e-05, -1.8572434782981873e-05, -1.5188008546829224e-05, -1.1803582310676575e-05, -8.419156074523926e-06, -5.034729838371277e-06, -1.650303602218628e-06, 1.734122633934021e-06, 5.11854887008667e-06, 8.502975106239319e-06, 1.1887401342391968e-05, 1.5271827578544617e-05, 1.8656253814697266e-05, 2.2040680050849915e-05, 2.5425106287002563e-05, 2.8809532523155212e-05, 3.219395875930786e-05, 3.557838499546051e-05, 3.896281123161316e-05, 4.234723746776581e-05, 4.573166370391846e-05, 4.9116089940071106e-05, 5.2500516176223755e-05, 5.5884942412376404e-05, 5.926936864852905e-05, 6.26537948846817e-05, 6.603822112083435e-05, 6.9422647356987e-05, 7.280707359313965e-05, 7.61914998292923e-05, 7.957592606544495e-05, 8.29603523015976e-05, 8.634477853775024e-05, 8.972920477390289e-05, 9.311363101005554e-05, 9.649805724620819e-05, 9.988248348236084e-05, 0.00010326690971851349, 0.00010665133595466614, 0.00011003576219081879, 0.00011342018842697144, 0.00011680461466312408, 0.00012018904089927673, 0.00012357346713542938, 0.00012695789337158203]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 3.0, 9.0, 7.0, 13.0, 15.0, 0.0, 17.0, 13.0, 21.0, 32.0, 27.0, 38.0, 0.0, 41.0, 45.0, 39.0, 59.0, 44.0, 57.0, 0.0, 51.0, 53.0, 57.0, 45.0, 33.0, 42.0, 0.0, 42.0, 41.0, 22.0, 25.0, 23.0, 16.0, 0.0, 20.0, 9.0, 10.0, 13.0, 8.0, 1.0, 0.0, 9.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4388933777809143e-06, -1.387670636177063e-06, -1.3364478945732117e-06, -1.2852251529693604e-06, -1.234002411365509e-06, -1.1827796697616577e-06, -1.1315569281578064e-06, -1.080334186553955e-06, -1.0291114449501038e-06, -9.778887033462524e-07, -9.266659617424011e-07, -8.754432201385498e-07, -8.242204785346985e-07, -7.729977369308472e-07, -7.217749953269958e-07, -6.705522537231445e-07, -6.193295121192932e-07, -5.681067705154419e-07, -5.168840289115906e-07, -4.6566128730773926e-07, -4.1443854570388794e-07, -3.632158041000366e-07, -3.119930624961853e-07, -2.60770320892334e-07, -2.0954757928848267e-07, -1.5832483768463135e-07, -1.0710209608078003e-07, -5.587935447692871e-08, -4.6566128730773926e-09, 4.6566128730773926e-08, 9.778887033462524e-08, 1.4901161193847656e-07, 2.0023435354232788e-07, 2.514570951461792e-07, 3.026798367500305e-07, 3.5390257835388184e-07, 4.0512531995773315e-07, 4.5634806156158447e-07, 5.075708031654358e-07, 5.587935447692871e-07, 6.100162863731384e-07, 6.612390279769897e-07, 7.124617695808411e-07, 7.636845111846924e-07, 8.149072527885437e-07, 8.66129994392395e-07, 9.173527359962463e-07, 9.685754776000977e-07, 1.019798219203949e-06, 1.0710209608078003e-06, 1.1222437024116516e-06, 1.173466444015503e-06, 1.2246891856193542e-06, 1.2759119272232056e-06, 1.3271346688270569e-06, 1.3783574104309082e-06, 1.4295801520347595e-06, 1.4808028936386108e-06, 1.5320256352424622e-06, 1.5832483768463135e-06, 1.6344711184501648e-06, 1.6856938600540161e-06, 1.7369166016578674e-06, 1.7881393432617188e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 3.0, 14.0, 20.0, 20.0, 39.0, 58.0, 58.0, 110.0, 146.0, 229.0, 328.0, 435.0, 677.0, 1020.0, 1594.0, 2362.0, 3597.0, 5988.0, 9604.0, 16779.0, 30023.0, 60205.0, 139807.0, 446950.0, 174075.0, 71466.0, 34966.0, 18818.0, 10728.0, 6568.0, 4082.0, 2645.0, 1696.0, 1114.0, 712.0, 515.0, 342.0, 245.0, 157.0, 107.0, 72.0, 63.0, 36.0, 29.0, 17.0, 12.0, 11.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00012183189392089844, -0.00011785142123699188, -0.00011387094855308533, -0.00010989047586917877, -0.00010591000318527222, -0.00010192953050136566, -9.79490578174591e-05, -9.396858513355255e-05, -8.9988112449646e-05, -8.600763976573944e-05, -8.202716708183289e-05, -7.804669439792633e-05, -7.406622171401978e-05, -7.008574903011322e-05, -6.610527634620667e-05, -6.212480366230011e-05, -5.8144330978393555e-05, -5.4163858294487e-05, -5.0183385610580444e-05, -4.620291292667389e-05, -4.2222440242767334e-05, -3.824196755886078e-05, -3.4261494874954224e-05, -3.028102219104767e-05, -2.6300549507141113e-05, -2.2320076823234558e-05, -1.8339604139328003e-05, -1.4359131455421448e-05, -1.0378658771514893e-05, -6.398186087608337e-06, -2.4177134037017822e-06, 1.562759280204773e-06, 5.543231964111328e-06, 9.523704648017883e-06, 1.3504177331924438e-05, 1.7484650015830994e-05, 2.146512269973755e-05, 2.5445595383644104e-05, 2.942606806755066e-05, 3.3406540751457214e-05, 3.738701343536377e-05, 4.1367486119270325e-05, 4.534795880317688e-05, 4.9328431487083435e-05, 5.330890417098999e-05, 5.7289376854896545e-05, 6.12698495388031e-05, 6.525032222270966e-05, 6.923079490661621e-05, 7.321126759052277e-05, 7.719174027442932e-05, 8.117221295833588e-05, 8.515268564224243e-05, 8.913315832614899e-05, 9.311363101005554e-05, 9.70941036939621e-05, 0.00010107457637786865, 0.00010505504906177521, 0.00010903552174568176, 0.00011301599442958832, 0.00011699646711349487, 0.00012097693979740143, 0.00012495741248130798, 0.00012893788516521454, 0.0001329183578491211]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 5.0, 6.0, 10.0, 9.0, 9.0, 12.0, 15.0, 17.0, 17.0, 18.0, 17.0, 36.0, 49.0, 45.0, 48.0, 47.0, 108.0, 144.0, 64.0, 40.0, 46.0, 34.0, 30.0, 21.0, 16.0, 23.0, 8.0, 14.0, 10.0, 11.0, 13.0, 2.0, 5.0, 8.0, 4.0, 7.0, 2.0, 7.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.719329833984375e-05, -3.603566437959671e-05, -3.487803041934967e-05, -3.372039645910263e-05, -3.256276249885559e-05, -3.140512853860855e-05, -3.024749457836151e-05, -2.908986061811447e-05, -2.793222665786743e-05, -2.6774592697620392e-05, -2.5616958737373352e-05, -2.4459324777126312e-05, -2.3301690816879272e-05, -2.2144056856632233e-05, -2.0986422896385193e-05, -1.9828788936138153e-05, -1.8671154975891113e-05, -1.7513521015644073e-05, -1.6355887055397034e-05, -1.5198253095149994e-05, -1.4040619134902954e-05, -1.2882985174655914e-05, -1.1725351214408875e-05, -1.0567717254161835e-05, -9.410083293914795e-06, -8.252449333667755e-06, -7.094815373420715e-06, -5.9371814131736755e-06, -4.779547452926636e-06, -3.621913492679596e-06, -2.464279532432556e-06, -1.3066455721855164e-06, -1.4901161193847656e-07, 1.0086223483085632e-06, 2.166256308555603e-06, 3.323890268802643e-06, 4.481524229049683e-06, 5.639158189296722e-06, 6.796792149543762e-06, 7.954426109790802e-06, 9.112060070037842e-06, 1.0269694030284882e-05, 1.1427327990531921e-05, 1.2584961950778961e-05, 1.3742595911026001e-05, 1.490022987127304e-05, 1.605786383152008e-05, 1.721549779176712e-05, 1.837313175201416e-05, 1.95307657122612e-05, 2.068839967250824e-05, 2.184603363275528e-05, 2.300366759300232e-05, 2.416130155324936e-05, 2.53189355134964e-05, 2.647656947374344e-05, 2.763420343399048e-05, 2.879183739423752e-05, 2.9949471354484558e-05, 3.11071053147316e-05, 3.226473927497864e-05, 3.342237323522568e-05, 3.458000719547272e-05, 3.573764115571976e-05, 3.68952751159668e-05]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 2.0, 5.0, 6.0, 4.0, 5.0, 17.0, 15.0, 18.0, 26.0, 32.0, 51.0, 50.0, 70.0, 92.0, 117.0, 104.0, 81.0, 73.0, 58.0, 23.0, 28.0, 17.0, 20.0, 12.0, 12.0, 16.0, 14.0, 6.0, 5.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00554812652990222, -0.005393202416598797, -0.005238277837634087, -0.005083353724330664, -0.004928429611027241, -0.004773505497723818, -0.004618581384420395, -0.004463656805455685, -0.004308732692152262, -0.004153808578848839, -0.003998883999884129, -0.0038439598865807056, -0.0036890357732772827, -0.00353411165997386, -0.003379187313839793, -0.0032242629677057266, -0.0030693388544023037, -0.0029144147410988808, -0.002759490394964814, -0.0026045660488307476, -0.0024496419355273247, -0.0022947178222239017, -0.002139793476089835, -0.0019848691299557686, -0.0018299450166523457, -0.001675020786933601, -0.0015200965572148561, -0.0013651723274961114, -0.0012102480977773666, -0.0010553238680586219, -0.0009003996383398771, -0.0007454754086211324, -0.0005905507132411003, -0.00043562648352235556, -0.0002807022538036108, -0.00012577802408486605, 2.9146205633878708e-05, 0.00018407043535262346, 0.0003389946650713682, 0.000493918894790113, 0.0006488431245088577, 0.0008037673542276025, 0.0009586915839463472, 0.001113615813665092, 0.0012685400433838367, 0.0014234642731025815, 0.0015783885028213263, 0.001733312732540071, 0.0018882369622588158, 0.0020431610755622387, 0.0021980854216963053, 0.002353009767830372, 0.002507933881133795, 0.0026628579944372177, 0.0028177823405712843, 0.002972706686705351, 0.003127630800008774, 0.0032825549133121967, 0.0034374792594462633, 0.00359240360558033, 0.003747327718883753, 0.0039022518321871758, 0.004057176411151886, 0.004212100524455309, 0.004367024637758732]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 5.0, 8.0, 11.0, 9.0, 14.0, 21.0, 19.0, 20.0, 27.0, 24.0, 51.0, 41.0, 42.0, 25.0, 62.0, 42.0, 46.0, 43.0, 32.0, 35.0, 44.0, 37.0, 54.0, 37.0, 32.0, 34.0, 24.0, 28.0, 19.0, 17.0, 15.0, 18.0, 17.0, 12.0, 6.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.003887579310685396, -0.0037686608266085386, -0.003649742342531681, -0.0035308238584548235, -0.003411905374377966, -0.003292987123131752, -0.0031740686390548944, -0.003055150154978037, -0.0029362316709011793, -0.0028173131868243217, -0.002698394702747464, -0.0025794762186706066, -0.0024605579674243927, -0.0023416392505168915, -0.0022227209992706776, -0.00210380251519382, -0.0019848840311169624, -0.0018659655470401049, -0.0017470470629632473, -0.0016281286953017116, -0.001509210211224854, -0.0013902917271479964, -0.0012713733594864607, -0.0011524548754096031, -0.0010335363913327456, -0.000914617907255888, -0.0007956994813866913, -0.0006767810555174947, -0.0005578625714406371, -0.00043894408736377954, -0.0003200256614945829, -0.00020110723562538624, -8.218851871788502e-05, 3.672993625514209e-05, 0.0001556483912281692, 0.0002745668462011963, 0.0003934853011742234, 0.000512403785251081, 0.0006313222111202776, 0.0007502406369894743, 0.0008691591210663319, 0.0009880776051431894, 0.001106996089220047, 0.0012259144568815827, 0.0013448329409584403, 0.0014637514250352979, 0.0015826697926968336, 0.0017015882767736912, 0.0018205067608505487, 0.0019394252449274063, 0.002058343729004264, 0.0021772622130811214, 0.0022961804643273354, 0.0024150991812348366, 0.0025340174324810505, 0.002652935916557908, 0.0027718544006347656, 0.002890772884711623, 0.0030096913687884808, 0.0031286098528653383, 0.003247528336942196, 0.00336644658818841, 0.0034853650722652674, 0.003604283556342125, 0.0037232020404189825]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 4.0, 7.0, 5.0, 12.0, 18.0, 23.0, 44.0, 54.0, 92.0, 138.0, 180.0, 289.0, 402.0, 605.0, 858.0, 1259.0, 1915.0, 2935.0, 4739.0, 7423.0, 11897.0, 19246.0, 32324.0, 59172.0, 115623.0, 228477.0, 256246.0, 138547.0, 69661.0, 37745.0, 21876.0, 13332.0, 8120.0, 5267.0, 3432.0, 2182.0, 1432.0, 975.0, 650.0, 409.0, 278.0, 205.0, 123.0, 102.0, 62.0, 51.0, 38.0, 25.0, 25.0, 12.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.00835418701171875, -0.00810939073562622, -0.007864594459533691, -0.007619798183441162, -0.007375001907348633, -0.0071302056312561035, -0.006885409355163574, -0.006640613079071045, -0.006395816802978516, -0.006151020526885986, -0.005906224250793457, -0.005661427974700928, -0.0054166316986083984, -0.005171835422515869, -0.00492703914642334, -0.0046822428703308105, -0.004437446594238281, -0.004192650318145752, -0.003947854042053223, -0.0037030577659606934, -0.003458261489868164, -0.0032134652137756348, -0.0029686689376831055, -0.002723872661590576, -0.002479076385498047, -0.0022342801094055176, -0.0019894838333129883, -0.001744687557220459, -0.0014998912811279297, -0.0012550950050354004, -0.001010298728942871, -0.0007655024528503418, -0.0005207061767578125, -0.0002759099006652832, -3.1113624572753906e-05, 0.0002136826515197754, 0.0004584789276123047, 0.000703275203704834, 0.0009480714797973633, 0.0011928677558898926, 0.0014376640319824219, 0.0016824603080749512, 0.0019272565841674805, 0.0021720528602600098, 0.002416849136352539, 0.0026616454124450684, 0.0029064416885375977, 0.003151237964630127, 0.0033960342407226562, 0.0036408305168151855, 0.003885626792907715, 0.004130423069000244, 0.0043752193450927734, 0.004620015621185303, 0.004864811897277832, 0.005109608173370361, 0.005354404449462891, 0.00559920072555542, 0.005843997001647949, 0.0060887932777404785, 0.006333589553833008, 0.006578385829925537, 0.006823182106018066, 0.007067978382110596, 0.007312774658203125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 10.0, 11.0, 7.0, 15.0, 18.0, 18.0, 20.0, 28.0, 29.0, 37.0, 48.0, 33.0, 35.0, 45.0, 45.0, 47.0, 38.0, 38.0, 30.0, 54.0, 51.0, 31.0, 46.0, 42.0, 31.0, 31.0, 27.0, 18.0, 15.0, 18.0, 15.0, 7.0, 15.0, 11.0, 11.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0032596588134765625, -0.0031508803367614746, -0.0030421018600463867, -0.002933323383331299, -0.002824544906616211, -0.002715766429901123, -0.002606987953186035, -0.0024982094764709473, -0.0023894309997558594, -0.0022806525230407715, -0.0021718740463256836, -0.0020630955696105957, -0.001954317092895508, -0.00184553861618042, -0.001736760139465332, -0.0016279816627502441, -0.0015192031860351562, -0.0014104247093200684, -0.0013016462326049805, -0.0011928677558898926, -0.0010840892791748047, -0.0009753108024597168, -0.0008665323257446289, -0.000757753849029541, -0.0006489753723144531, -0.0005401968955993652, -0.00043141841888427734, -0.00032263994216918945, -0.00021386146545410156, -0.00010508298873901367, 3.6954879760742188e-06, 0.00011247396469116211, 0.00022125244140625, 0.0003300309181213379, 0.0004388093948364258, 0.0005475878715515137, 0.0006563663482666016, 0.0007651448249816895, 0.0008739233016967773, 0.0009827017784118652, 0.0010914802551269531, 0.001200258731842041, 0.001309037208557129, 0.0014178156852722168, 0.0015265941619873047, 0.0016353726387023926, 0.0017441511154174805, 0.0018529295921325684, 0.0019617080688476562, 0.002070486545562744, 0.002179265022277832, 0.00228804349899292, 0.002396821975708008, 0.0025056004524230957, 0.0026143789291381836, 0.0027231574058532715, 0.0028319358825683594, 0.0029407143592834473, 0.003049492835998535, 0.003158271312713623, 0.003267049789428711, 0.003375828266143799, 0.0034846067428588867, 0.0035933852195739746, 0.0037021636962890625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 14.0, 18.0, 19.0, 38.0, 53.0, 75.0, 110.0, 165.0, 207.0, 325.0, 500.0, 764.0, 1169.0, 1557.0, 2361.0, 3489.0, 5090.0, 7556.0, 11729.0, 18158.0, 28500.0, 46377.0, 79106.0, 151581.0, 293116.0, 171978.0, 86350.0, 50392.0, 30684.0, 19480.0, 12429.0, 8241.0, 5537.0, 3707.0, 2461.0, 1557.0, 1171.0, 821.0, 523.0, 363.0, 244.0, 194.0, 122.0, 80.0, 56.0, 30.0, 18.0, 12.0, 11.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007144927978515625, -0.006918668746948242, -0.006692409515380859, -0.0064661502838134766, -0.006239891052246094, -0.006013631820678711, -0.005787372589111328, -0.005561113357543945, -0.0053348541259765625, -0.00510859489440918, -0.004882335662841797, -0.004656076431274414, -0.004429817199707031, -0.0042035579681396484, -0.003977298736572266, -0.003751039505004883, -0.0035247802734375, -0.003298521041870117, -0.0030722618103027344, -0.0028460025787353516, -0.0026197433471679688, -0.002393484115600586, -0.002167224884033203, -0.0019409656524658203, -0.0017147064208984375, -0.0014884471893310547, -0.0012621879577636719, -0.001035928726196289, -0.0008096694946289062, -0.0005834102630615234, -0.0003571510314941406, -0.0001308917999267578, 9.5367431640625e-05, 0.0003216266632080078, 0.0005478858947753906, 0.0007741451263427734, 0.0010004043579101562, 0.001226663589477539, 0.0014529228210449219, 0.0016791820526123047, 0.0019054412841796875, 0.0021317005157470703, 0.002357959747314453, 0.002584218978881836, 0.0028104782104492188, 0.0030367374420166016, 0.0032629966735839844, 0.003489255905151367, 0.00371551513671875, 0.003941774368286133, 0.004168033599853516, 0.0043942928314208984, 0.004620552062988281, 0.004846811294555664, 0.005073070526123047, 0.00529932975769043, 0.0055255889892578125, 0.005751848220825195, 0.005978107452392578, 0.006204366683959961, 0.006430625915527344, 0.0066568851470947266, 0.006883144378662109, 0.007109403610229492, 0.007335662841796875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 7.0, 9.0, 8.0, 8.0, 14.0, 20.0, 17.0, 9.0, 20.0, 21.0, 29.0, 26.0, 30.0, 32.0, 34.0, 32.0, 32.0, 38.0, 38.0, 36.0, 39.0, 51.0, 33.0, 41.0, 39.0, 44.0, 37.0, 26.0, 31.0, 24.0, 21.0, 24.0, 22.0, 19.0, 17.0, 10.0, 10.0, 5.0, 13.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017824172973632812, -0.0017190128564834595, -0.0016556084156036377, -0.001592203974723816, -0.0015287995338439941, -0.0014653950929641724, -0.0014019906520843506, -0.0013385862112045288, -0.001275181770324707, -0.0012117773294448853, -0.0011483728885650635, -0.0010849684476852417, -0.00102156400680542, -0.0009581595659255981, -0.0008947551250457764, -0.0008313506841659546, -0.0007679462432861328, -0.000704541802406311, -0.0006411373615264893, -0.0005777329206466675, -0.0005143284797668457, -0.0004509240388870239, -0.00038751959800720215, -0.00032411515712738037, -0.0002607107162475586, -0.00019730627536773682, -0.00013390183448791504, -7.049739360809326e-05, -7.092952728271484e-06, 5.631148815155029e-05, 0.00011971592903137207, 0.00018312036991119385, 0.0002465248107910156, 0.0003099292516708374, 0.0003733336925506592, 0.00043673813343048096, 0.0005001425743103027, 0.0005635470151901245, 0.0006269514560699463, 0.0006903558969497681, 0.0007537603378295898, 0.0008171647787094116, 0.0008805692195892334, 0.0009439736604690552, 0.001007378101348877, 0.0010707825422286987, 0.0011341869831085205, 0.0011975914239883423, 0.001260995864868164, 0.0013244003057479858, 0.0013878047466278076, 0.0014512091875076294, 0.0015146136283874512, 0.001578018069267273, 0.0016414225101470947, 0.0017048269510269165, 0.0017682313919067383, 0.00183163583278656, 0.0018950402736663818, 0.0019584447145462036, 0.0020218491554260254, 0.002085253596305847, 0.002148658037185669, 0.0022120624780654907, 0.0022754669189453125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 7.0, 9.0, 7.0, 16.0, 17.0, 35.0, 55.0, 62.0, 94.0, 173.0, 292.0, 512.0, 900.0, 1533.0, 2941.0, 5519.0, 11256.0, 25029.0, 63496.0, 195928.0, 423824.0, 202344.0, 65236.0, 25459.0, 11554.0, 5563.0, 2922.0, 1629.0, 857.0, 495.0, 301.0, 175.0, 100.0, 65.0, 47.0, 30.0, 20.0, 14.0, 13.0, 13.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005741119384765625, -0.000556454062461853, -0.0005387961864471436, -0.0005211383104324341, -0.0005034804344177246, -0.00048582255840301514, -0.00046816468238830566, -0.0004505068063735962, -0.0004328489303588867, -0.00041519105434417725, -0.0003975331783294678, -0.0003798753023147583, -0.00036221742630004883, -0.00034455955028533936, -0.0003269016742706299, -0.0003092437982559204, -0.00029158592224121094, -0.00027392804622650146, -0.000256270170211792, -0.00023861229419708252, -0.00022095441818237305, -0.00020329654216766357, -0.0001856386661529541, -0.00016798079013824463, -0.00015032291412353516, -0.00013266503810882568, -0.00011500716209411621, -9.734928607940674e-05, -7.969141006469727e-05, -6.203353404998779e-05, -4.437565803527832e-05, -2.6717782020568848e-05, -9.059906005859375e-06, 8.597970008850098e-06, 2.625584602355957e-05, 4.391372203826904e-05, 6.157159805297852e-05, 7.922947406768799e-05, 9.688735008239746e-05, 0.00011454522609710693, 0.0001322031021118164, 0.00014986097812652588, 0.00016751885414123535, 0.00018517673015594482, 0.0002028346061706543, 0.00022049248218536377, 0.00023815035820007324, 0.0002558082342147827, 0.0002734661102294922, 0.00029112398624420166, 0.00030878186225891113, 0.0003264397382736206, 0.0003440976142883301, 0.00036175549030303955, 0.000379413366317749, 0.0003970712423324585, 0.00041472911834716797, 0.00043238699436187744, 0.0004500448703765869, 0.0004677027463912964, 0.00048536062240600586, 0.0005030184984207153, 0.0005206763744354248, 0.0005383342504501343, 0.0005559921264648438]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 8.0, 0.0, 0.0, 17.0, 0.0, 23.0, 0.0, 0.0, 40.0, 0.0, 56.0, 0.0, 0.0, 86.0, 0.0, 109.0, 0.0, 102.0, 0.0, 0.0, 115.0, 0.0, 117.0, 0.0, 0.0, 108.0, 0.0, 80.0, 0.0, 0.0, 50.0, 0.0, 45.0, 0.0, 0.0, 25.0, 0.0, 22.0, 0.0, 0.0, 8.0, 0.0, 6.0, 0.0, 2.0], "bins": [-9.5367431640625e-07, -9.294599294662476e-07, -9.052455425262451e-07, -8.810311555862427e-07, -8.568167686462402e-07, -8.326023817062378e-07, -8.083879947662354e-07, -7.841736078262329e-07, -7.599592208862305e-07, -7.35744833946228e-07, -7.115304470062256e-07, -6.873160600662231e-07, -6.631016731262207e-07, -6.388872861862183e-07, -6.146728992462158e-07, -5.904585123062134e-07, -5.662441253662109e-07, -5.420297384262085e-07, -5.178153514862061e-07, -4.936009645462036e-07, -4.6938657760620117e-07, -4.4517219066619873e-07, -4.209578037261963e-07, -3.9674341678619385e-07, -3.725290298461914e-07, -3.4831464290618896e-07, -3.241002559661865e-07, -2.998858690261841e-07, -2.7567148208618164e-07, -2.514570951461792e-07, -2.2724270820617676e-07, -2.0302832126617432e-07, -1.7881393432617188e-07, -1.5459954738616943e-07, -1.30385160446167e-07, -1.0617077350616455e-07, -8.195638656616211e-08, -5.774199962615967e-08, -3.3527612686157227e-08, -9.313225746154785e-09, 1.4901161193847656e-08, 3.91155481338501e-08, 6.332993507385254e-08, 8.754432201385498e-08, 1.1175870895385742e-07, 1.3597309589385986e-07, 1.601874828338623e-07, 1.8440186977386475e-07, 2.086162567138672e-07, 2.3283064365386963e-07, 2.5704503059387207e-07, 2.812594175338745e-07, 3.0547380447387695e-07, 3.296881914138794e-07, 3.5390257835388184e-07, 3.781169652938843e-07, 4.023313522338867e-07, 4.2654573917388916e-07, 4.507601261138916e-07, 4.7497451305389404e-07, 4.991888999938965e-07, 5.234032869338989e-07, 5.476176738739014e-07, 5.718320608139038e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 13.0, 16.0, 16.0, 27.0, 38.0, 53.0, 77.0, 108.0, 143.0, 219.0, 293.0, 465.0, 649.0, 932.0, 1376.0, 2111.0, 3243.0, 4971.0, 8128.0, 14202.0, 26479.0, 58089.0, 161091.0, 387685.0, 224800.0, 77487.0, 32806.0, 16557.0, 9811.0, 5751.0, 3625.0, 2312.0, 1506.0, 1054.0, 741.0, 477.0, 365.0, 255.0, 153.0, 107.0, 81.0, 79.0, 47.0, 26.0, 27.0, 16.0, 12.0, 11.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0004982948303222656, -0.00048203766345977783, -0.00046578049659729004, -0.00044952332973480225, -0.00043326616287231445, -0.00041700899600982666, -0.00040075182914733887, -0.0003844946622848511, -0.0003682374954223633, -0.0003519803285598755, -0.0003357231616973877, -0.0003194659948348999, -0.0003032088279724121, -0.0002869516611099243, -0.0002706944942474365, -0.00025443732738494873, -0.00023818016052246094, -0.00022192299365997314, -0.00020566582679748535, -0.00018940865993499756, -0.00017315149307250977, -0.00015689432621002197, -0.00014063715934753418, -0.0001243799924850464, -0.0001081228256225586, -9.18656587600708e-05, -7.560849189758301e-05, -5.9351325035095215e-05, -4.309415817260742e-05, -2.683699131011963e-05, -1.0579824447631836e-05, 5.677342414855957e-06, 2.193450927734375e-05, 3.819167613983154e-05, 5.4448843002319336e-05, 7.070600986480713e-05, 8.696317672729492e-05, 0.00010322034358978271, 0.00011947751045227051, 0.0001357346773147583, 0.0001519918441772461, 0.0001682490110397339, 0.00018450617790222168, 0.00020076334476470947, 0.00021702051162719727, 0.00023327767848968506, 0.00024953484535217285, 0.00026579201221466064, 0.00028204917907714844, 0.00029830634593963623, 0.000314563512802124, 0.0003308206796646118, 0.0003470778465270996, 0.0003633350133895874, 0.0003795921802520752, 0.000395849347114563, 0.0004121065139770508, 0.0004283636808395386, 0.00044462084770202637, 0.00046087801456451416, 0.00047713518142700195, 0.0004933923482894897, 0.0005096495151519775, 0.0005259066820144653, 0.0005421638488769531]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 3.0, 4.0, 6.0, 8.0, 5.0, 17.0, 12.0, 19.0, 17.0, 20.0, 38.0, 44.0, 55.0, 62.0, 87.0, 84.0, 96.0, 80.0, 51.0, 61.0, 46.0, 37.0, 29.0, 31.0, 21.0, 16.0, 17.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013399124145507812, -0.00012954510748386383, -0.00012509897351264954, -0.00012065283954143524, -0.00011620670557022095, -0.00011176057159900665, -0.00010731443762779236, -0.00010286830365657806, -9.842216968536377e-05, -9.397603571414948e-05, -8.952990174293518e-05, -8.508376777172089e-05, -8.063763380050659e-05, -7.61914998292923e-05, -7.1745365858078e-05, -6.729923188686371e-05, -6.285309791564941e-05, -5.840696394443512e-05, -5.3960829973220825e-05, -4.951469600200653e-05, -4.5068562030792236e-05, -4.062242805957794e-05, -3.617629408836365e-05, -3.173016011714935e-05, -2.728402614593506e-05, -2.2837892174720764e-05, -1.839175820350647e-05, -1.3945624232292175e-05, -9.499490261077881e-06, -5.0533562898635864e-06, -6.07222318649292e-07, 3.8389116525650024e-06, 8.285045623779297e-06, 1.2731179594993591e-05, 1.7177313566207886e-05, 2.162344753742218e-05, 2.6069581508636475e-05, 3.051571547985077e-05, 3.4961849451065063e-05, 3.940798342227936e-05, 4.385411739349365e-05, 4.830025136470795e-05, 5.274638533592224e-05, 5.7192519307136536e-05, 6.163865327835083e-05, 6.608478724956512e-05, 7.053092122077942e-05, 7.497705519199371e-05, 7.942318916320801e-05, 8.38693231344223e-05, 8.83154571056366e-05, 9.276159107685089e-05, 9.720772504806519e-05, 0.00010165385901927948, 0.00010609999299049377, 0.00011054612696170807, 0.00011499226093292236, 0.00011943839490413666, 0.00012388452887535095, 0.00012833066284656525, 0.00013277679681777954, 0.00013722293078899384, 0.00014166906476020813, 0.00014611519873142242, 0.00015056133270263672]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 0.0, 4.0, 3.0, 6.0, 9.0, 7.0, 6.0, 6.0, 12.0, 16.0, 21.0, 31.0, 33.0, 46.0, 63.0, 106.0, 137.0, 129.0, 100.0, 74.0, 58.0, 37.0, 18.0, 19.0, 11.0, 15.0, 7.0, 8.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.007868672721087933, -0.007675983943045139, -0.007483294699341059, -0.0072906059212982655, -0.007097917143255472, -0.006905227899551392, -0.006712539121508598, -0.006519850343465805, -0.006327161565423012, -0.0061344727873802185, -0.005941783543676138, -0.005749094765633345, -0.005556405987590551, -0.005363716743886471, -0.0051710279658436775, -0.004978339187800884, -0.004785649944096804, -0.00459296116605401, -0.00440027192234993, -0.0042075831443071365, -0.004014894366264343, -0.0038222053553909063, -0.0036295163445174694, -0.003436827566474676, -0.003244138555601239, -0.0030514495447278023, -0.002858760766685009, -0.002666071755811572, -0.002473382744938135, -0.002280693966895342, -0.002088004956021905, -0.0018953160615637898, -0.0017026271671056747, -0.0015099382726475596, -0.0013172493781894445, -0.0011245603673160076, -0.0009318714728578925, -0.0007391825783997774, -0.0005464935675263405, -0.0003538046730682254, -0.00016111577861011028, 3.1573144951835275e-05, 0.00022426206851378083, 0.00041695102117955685, 0.000609639915637672, 0.000802328810095787, 0.000995017820969224, 0.001187706715427339, 0.0013803956098854542, 0.0015730845043435693, 0.0017657733988016844, 0.0019584624096751213, 0.0021511511877179146, 0.0023438401985913515, 0.0025365292094647884, 0.0027292179875075817, 0.0029219069983810186, 0.0031145960092544556, 0.003307284787297249, 0.0034999737981706858, 0.0036926628090441227, 0.003885351587086916, 0.0040780408307909966, 0.00427072960883379, 0.004463418386876583]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 13.0, 21.0, 16.0, 22.0, 32.0, 25.0, 31.0, 46.0, 30.0, 37.0, 51.0, 53.0, 52.0, 47.0, 41.0, 50.0, 52.0, 45.0, 43.0, 38.0, 35.0, 27.0, 32.0, 26.0, 22.0, 17.0, 13.0, 10.0, 12.0, 7.0, 10.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0041491747833788395, -0.004014887381345034, -0.003880600444972515, -0.003746313275769353, -0.0036120261065661907, -0.003477738704532385, -0.0033434515353292227, -0.0032091643661260605, -0.0030748771969228983, -0.002940590027719736, -0.002806302858516574, -0.0026720156893134117, -0.002537728287279606, -0.0024034413509070873, -0.0022691539488732815, -0.0021348667796701193, -0.002000579610466957, -0.001866292441263795, -0.0017320052720606327, -0.0015977179864421487, -0.0014634308172389865, -0.0013291436480358243, -0.0011948563624173403, -0.001060569193214178, -0.0009262820240110159, -0.0007919948548078537, -0.0006577076273970306, -0.0005234203999862075, -0.0003891332307830453, -0.0002548460615798831, -0.00012055883416905999, 1.3728393241763115e-05, 0.000148015096783638, 0.00028230229509063065, 0.0004165894933976233, 0.0005508767208084464, 0.0006851638900116086, 0.0008194510592147708, 0.0009537382866255939, 0.001088025514036417, 0.0012223126832395792, 0.0013565998524427414, 0.0014908870216459036, 0.0016251743072643876, 0.0017594614764675498, 0.001893748645670712, 0.002028035931289196, 0.002162323100492358, 0.0022966102696955204, 0.0024308974388986826, 0.002565184608101845, 0.002699471777305007, 0.002833758946508169, 0.002968046348541975, 0.003102333517745137, 0.0032366206869482994, 0.0033709078561514616, 0.003505195025354624, 0.003639482194557786, 0.003773769363760948, 0.003908056765794754, 0.004042343702167273, 0.004176631104201078, 0.004310918040573597, 0.004445205442607403]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 4.0, 2.0, 4.0, 5.0, 2.0, 18.0, 17.0, 18.0, 16.0, 33.0, 24.0, 23.0, 37.0, 35.0, 54.0, 48.0, 57.0, 277.0, 3549.0, 519139.0, 465.0, 73.0, 51.0, 48.0, 28.0, 46.0, 35.0, 29.0, 21.0, 16.0, 20.0, 15.0, 12.0, 8.0, 12.0, 8.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11199209839105606, -0.10827292501926422, -0.10455375909805298, -0.10083458572626114, -0.0971154123544693, -0.09339624643325806, -0.08967707306146622, -0.08595789968967438, -0.08223873376846313, -0.0785195603966713, -0.07480039447546005, -0.07108122110366821, -0.06736205518245697, -0.06364288181066513, -0.05992370843887329, -0.05620453879237175, -0.05248536914587021, -0.04876619949936867, -0.045047029852867126, -0.04132785648107529, -0.037608686834573746, -0.033889517188072205, -0.030170345678925514, -0.026451174169778824, -0.022732004523277283, -0.01901283487677574, -0.015293663367629051, -0.011574492789804935, -0.00785532221198082, -0.0041361525654792786, -0.0004169810563325882, 0.003302190452814102, 0.007021352648735046, 0.010740523226559162, 0.014459693804383278, 0.018178865313529968, 0.02189803496003151, 0.02561720460653305, 0.02933637611567974, 0.03305554762482643, 0.03677471727132797, 0.040493886917829514, 0.044213056564331055, 0.047932229936122894, 0.051651399582624435, 0.05537056922912598, 0.059089742600917816, 0.06280891597270966, 0.0665280818939209, 0.07024725526571274, 0.07396642118692398, 0.07768559455871582, 0.08140476047992706, 0.0851239338517189, 0.08884310722351074, 0.09256227314472198, 0.09628144651651382, 0.10000061988830566, 0.1037197858095169, 0.10743895918130875, 0.11115813255310059, 0.11487729847431183, 0.11859647184610367, 0.12231564521789551, 0.12603481113910675]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 12.0, 21.0, 17.0, 22.0, 30.0, 26.0, 32.0, 45.0, 31.0, 39.0, 51.0, 51.0, 52.0, 1071.0, 42.0, 48.0, 53.0, 46.0, 45.0, 36.0, 35.0, 26.0, 31.0, 26.0, 24.0, 17.0, 12.0, 9.0, 13.0, 7.0, 10.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11969549208879471, -0.11583179235458374, -0.11196809262037277, -0.1081043928861618, -0.10424069315195084, -0.10037699341773987, -0.0965132936835289, -0.09264959394931793, -0.08878589421510696, -0.084922194480896, -0.08105849474668503, -0.07719479501247406, -0.07333109527826309, -0.06946739554405212, -0.06560369580984116, -0.06173999607563019, -0.05787629634141922, -0.05401259660720825, -0.050148896872997284, -0.046285197138786316, -0.04242149740457535, -0.03855779767036438, -0.03469409793615341, -0.030830398201942444, -0.026966698467731476, -0.023102998733520508, -0.01923929899930954, -0.015375599265098572, -0.011511899530887604, -0.007648199796676636, -0.0037845000624656677, 7.919967174530029e-05, 0.003942891955375671, 0.007806591689586639, 0.011670291423797607, 0.015533991158008575, 0.019397690892219543, 0.02326139062643051, 0.02712509036064148, 0.030988790094852448, 0.034852489829063416, 0.038716189563274384, 0.04257988929748535, 0.04644358903169632, 0.05030728876590729, 0.054170988500118256, 0.058034688234329224, 0.06189838796854019, 0.06576208770275116, 0.06962578743696213, 0.0734894871711731, 0.07735318690538406, 0.08121688663959503, 0.085080586373806, 0.08894428610801697, 0.09280798584222794, 0.0966716855764389, 0.10053538531064987, 0.10439908504486084, 0.10826278477907181, 0.11212648451328278, 0.11599018424749374, 0.11985388398170471, 0.12371758371591568, 0.12758128345012665]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 4.0, 5.0, 9.0, 5.0, 6.0, 14.0, 10.0, 5.0, 16.0, 12.0, 18.0, 17.0, 17.0, 35.0, 76.0, 119.0, 162.0, 222.0, 331.0, 487.0, 668.0, 885.0, 1006.0, 1519.0, 1607.0, 3422.0, 16147.0, 31200628.0, 10509.0, 13964.0, 849.0, 648.0, 207.0, 177.0, 542.0, 54.0, 26.0, 19.0, 14.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0], "bins": [-11776.0, -11521.625, -11267.25, -11012.875, -10758.5, -10504.125, -10249.75, -9995.375, -9741.0, -9486.625, -9232.25, -8977.875, -8723.5, -8469.125, -8214.75, -7960.375, -7706.0, -7451.625, -7197.25, -6942.875, -6688.5, -6434.125, -6179.75, -5925.375, -5671.0, -5416.625, -5162.25, -4907.875, -4653.5, -4399.125, -4144.75, -3890.375, -3636.0, -3381.625, -3127.25, -2872.875, -2618.5, -2364.125, -2109.75, -1855.375, -1601.0, -1346.625, -1092.25, -837.875, -583.5, -329.125, -74.75, 179.625, 434.0, 688.375, 942.75, 1197.125, 1451.5, 1705.875, 1960.25, 2214.625, 2469.0, 2723.375, 2977.75, 3232.125, 3486.5, 3740.875, 3995.25, 4249.625, 4504.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 3.0, 6.0, 17.0, 8.0, 20.0, 33.0, 30.0, 57.0, 51.0, 80.0, 131.0, 177.0, 286.0, 480.0, 769.0, 1214.0, 1955.0, 3301.0, 6538.0, 13756.0, 30146.0, 78654.0, 235937.0, 1131647.0, 4184934.0, 401598.0, 118520.0, 43318.0, 18235.0, 8435.0, 4482.0, 2608.0, 1418.0, 813.0, 533.0, 364.0, 242.0, 167.0, 138.0, 83.0, 76.0, 42.0, 36.0, 24.0, 18.0, 7.0, 8.0, 5.0, 3.0, 4.0, 10.0, 3.0, 3.0, 7.0, 0.0, 2.0, 1.0], "bins": [-20.65625, -19.994384765625, -19.33251953125, -18.670654296875, -18.0087890625, -17.346923828125, -16.68505859375, -16.023193359375, -15.361328125, -14.699462890625, -14.03759765625, -13.375732421875, -12.7138671875, -12.052001953125, -11.39013671875, -10.728271484375, -10.06640625, -9.404541015625, -8.74267578125, -8.080810546875, -7.4189453125, -6.757080078125, -6.09521484375, -5.433349609375, -4.771484375, -4.109619140625, -3.44775390625, -2.785888671875, -2.1240234375, -1.462158203125, -0.80029296875, -0.138427734375, 0.5234375, 1.185302734375, 1.84716796875, 2.509033203125, 3.1708984375, 3.832763671875, 4.49462890625, 5.156494140625, 5.818359375, 6.480224609375, 7.14208984375, 7.803955078125, 8.4658203125, 9.127685546875, 9.78955078125, 10.451416015625, 11.11328125, 11.775146484375, 12.43701171875, 13.098876953125, 13.7607421875, 14.422607421875, 15.08447265625, 15.746337890625, 16.408203125, 17.070068359375, 17.73193359375, 18.393798828125, 19.0556640625, 19.717529296875, 20.37939453125, 21.041259765625, 21.703125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 10.0, 6.0, 14.0, 13.0, 12.0, 20.0, 17.0, 23.0, 23.0, 39.0, 35.0, 30.0, 45.0, 46.0, 62.0, 76.0, 98.0, 227.0, 537.0, 204.0, 90.0, 55.0, 44.0, 24.0, 37.0, 34.0, 34.0, 32.0, 28.0, 22.0, 13.0, 15.0, 10.0, 8.0, 10.0, 8.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.84375, -24.100830078125, -23.35791015625, -22.614990234375, -21.8720703125, -21.129150390625, -20.38623046875, -19.643310546875, -18.900390625, -18.157470703125, -17.41455078125, -16.671630859375, -15.9287109375, -15.185791015625, -14.44287109375, -13.699951171875, -12.95703125, -12.214111328125, -11.47119140625, -10.728271484375, -9.9853515625, -9.242431640625, -8.49951171875, -7.756591796875, -7.013671875, -6.270751953125, -5.52783203125, -4.784912109375, -4.0419921875, -3.299072265625, -2.55615234375, -1.813232421875, -1.0703125, -0.327392578125, 0.41552734375, 1.158447265625, 1.9013671875, 2.644287109375, 3.38720703125, 4.130126953125, 4.873046875, 5.615966796875, 6.35888671875, 7.101806640625, 7.8447265625, 8.587646484375, 9.33056640625, 10.073486328125, 10.81640625, 11.559326171875, 12.30224609375, 13.045166015625, 13.7880859375, 14.531005859375, 15.27392578125, 16.016845703125, 16.759765625, 17.502685546875, 18.24560546875, 18.988525390625, 19.7314453125, 20.474365234375, 21.21728515625, 21.960205078125, 22.703125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 12.0, 2.0, 1.0, 8.0, 7.0, 13.0, 11.0, 19.0, 28.0, 44.0, 55.0, 85.0, 115.0, 205.0, 224.0, 348.0, 543.0, 820.0, 1212.0, 1829.0, 2859.0, 4467.0, 7381.0, 12391.0, 20542.0, 36133.0, 67696.0, 131362.0, 287251.0, 868090.0, 3790678.0, 589799.0, 227985.0, 106707.0, 55542.0, 30517.0, 17865.0, 10446.0, 6701.0, 4035.0, 2497.0, 1608.0, 1126.0, 726.0, 486.0, 303.0, 183.0, 155.0, 97.0, 66.0, 48.0, 46.0, 30.0, 10.0, 8.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0], "bins": [-12.140625, -11.776611328125, -11.41259765625, -11.048583984375, -10.6845703125, -10.320556640625, -9.95654296875, -9.592529296875, -9.228515625, -8.864501953125, -8.50048828125, -8.136474609375, -7.7724609375, -7.408447265625, -7.04443359375, -6.680419921875, -6.31640625, -5.952392578125, -5.58837890625, -5.224365234375, -4.8603515625, -4.496337890625, -4.13232421875, -3.768310546875, -3.404296875, -3.040283203125, -2.67626953125, -2.312255859375, -1.9482421875, -1.584228515625, -1.22021484375, -0.856201171875, -0.4921875, -0.128173828125, 0.23583984375, 0.599853515625, 0.9638671875, 1.327880859375, 1.69189453125, 2.055908203125, 2.419921875, 2.783935546875, 3.14794921875, 3.511962890625, 3.8759765625, 4.239990234375, 4.60400390625, 4.968017578125, 5.33203125, 5.696044921875, 6.06005859375, 6.424072265625, 6.7880859375, 7.152099609375, 7.51611328125, 7.880126953125, 8.244140625, 8.608154296875, 8.97216796875, 9.336181640625, 9.7001953125, 10.064208984375, 10.42822265625, 10.792236328125, 11.15625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 8.0, 8.0, 1.0, 14.0, 9.0, 12.0, 10.0, 17.0, 22.0, 18.0, 24.0, 22.0, 32.0, 40.0, 46.0, 52.0, 70.0, 91.0, 136.0, 264.0, 472.0, 166.0, 72.0, 59.0, 41.0, 41.0, 30.0, 28.0, 35.0, 18.0, 25.0, 25.0, 17.0, 21.0, 13.0, 11.0, 13.0, 10.0, 10.0, 8.0, 6.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-18.25, -17.7366943359375, -17.223388671875, -16.7100830078125, -16.19677734375, -15.6834716796875, -15.170166015625, -14.6568603515625, -14.1435546875, -13.6302490234375, -13.116943359375, -12.6036376953125, -12.09033203125, -11.5770263671875, -11.063720703125, -10.5504150390625, -10.037109375, -9.5238037109375, -9.010498046875, -8.4971923828125, -7.98388671875, -7.4705810546875, -6.957275390625, -6.4439697265625, -5.9306640625, -5.4173583984375, -4.904052734375, -4.3907470703125, -3.87744140625, -3.3641357421875, -2.850830078125, -2.3375244140625, -1.82421875, -1.3109130859375, -0.797607421875, -0.2843017578125, 0.22900390625, 0.7423095703125, 1.255615234375, 1.7689208984375, 2.2822265625, 2.7955322265625, 3.308837890625, 3.8221435546875, 4.33544921875, 4.8487548828125, 5.362060546875, 5.8753662109375, 6.388671875, 6.9019775390625, 7.415283203125, 7.9285888671875, 8.44189453125, 8.9552001953125, 9.468505859375, 9.9818115234375, 10.4951171875, 11.0084228515625, 11.521728515625, 12.0350341796875, 12.54833984375, 13.0616455078125, 13.574951171875, 14.0882568359375, 14.6015625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 5.0, 3.0, 5.0, 13.0, 11.0, 17.0, 22.0, 23.0, 17.0, 43.0, 36.0, 69.0, 67.0, 171.0, 218.0, 353.0, 509.0, 922.0, 1826.0, 4159.0, 12590.0, 66425.0, 6079180.0, 98468.0, 15820.0, 5432.0, 2281.0, 1120.0, 623.0, 362.0, 237.0, 112.0, 93.0, 48.0, 41.0, 17.0, 19.0, 22.0, 11.0, 10.0, 10.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-76.3125, -73.642578125, -70.97265625, -68.302734375, -65.6328125, -62.962890625, -60.29296875, -57.623046875, -54.953125, -52.283203125, -49.61328125, -46.943359375, -44.2734375, -41.603515625, -38.93359375, -36.263671875, -33.59375, -30.923828125, -28.25390625, -25.583984375, -22.9140625, -20.244140625, -17.57421875, -14.904296875, -12.234375, -9.564453125, -6.89453125, -4.224609375, -1.5546875, 1.115234375, 3.78515625, 6.455078125, 9.125, 11.794921875, 14.46484375, 17.134765625, 19.8046875, 22.474609375, 25.14453125, 27.814453125, 30.484375, 33.154296875, 35.82421875, 38.494140625, 41.1640625, 43.833984375, 46.50390625, 49.173828125, 51.84375, 54.513671875, 57.18359375, 59.853515625, 62.5234375, 65.193359375, 67.86328125, 70.533203125, 73.203125, 75.873046875, 78.54296875, 81.212890625, 83.8828125, 86.552734375, 89.22265625, 91.892578125, 94.5625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 10.0, 20.0, 18.0, 18.0, 30.0, 46.0, 69.0, 92.0, 138.0, 271.0, 673.0, 205.0, 99.0, 74.0, 61.0, 49.0, 41.0, 23.0, 20.0, 14.0, 10.0, 8.0, 9.0, 6.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.46875, -30.6337890625, -29.798828125, -28.9638671875, -28.12890625, -27.2939453125, -26.458984375, -25.6240234375, -24.7890625, -23.9541015625, -23.119140625, -22.2841796875, -21.44921875, -20.6142578125, -19.779296875, -18.9443359375, -18.109375, -17.2744140625, -16.439453125, -15.6044921875, -14.76953125, -13.9345703125, -13.099609375, -12.2646484375, -11.4296875, -10.5947265625, -9.759765625, -8.9248046875, -8.08984375, -7.2548828125, -6.419921875, -5.5849609375, -4.75, -3.9150390625, -3.080078125, -2.2451171875, -1.41015625, -0.5751953125, 0.259765625, 1.0947265625, 1.9296875, 2.7646484375, 3.599609375, 4.4345703125, 5.26953125, 6.1044921875, 6.939453125, 7.7744140625, 8.609375, 9.4443359375, 10.279296875, 11.1142578125, 11.94921875, 12.7841796875, 13.619140625, 14.4541015625, 15.2890625, 16.1240234375, 16.958984375, 17.7939453125, 18.62890625, 19.4638671875, 20.298828125, 21.1337890625, 21.96875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 30.0, 120.0, 841.0, 13.0, 2.0, 3.0, 3.0], "bins": [-1123.0831298828125, -1104.1243896484375, -1085.16552734375, -1066.206787109375, -1047.248046875, -1028.2891845703125, -1009.3304443359375, -990.3716430664062, -971.412841796875, -952.4540405273438, -933.4952392578125, -914.5364990234375, -895.5776977539062, -876.618896484375, -857.66015625, -838.7013549804688, -819.7425537109375, -800.7837524414062, -781.824951171875, -762.8662109375, -743.9074096679688, -724.9486083984375, -705.9898681640625, -687.0310668945312, -668.072265625, -649.1134643554688, -630.1546630859375, -611.1959228515625, -592.2371215820312, -573.2783203125, -554.319580078125, -535.3607788085938, -516.4020385742188, -497.4432373046875, -478.4844665527344, -459.52569580078125, -440.56689453125, -421.60809326171875, -402.6493225097656, -383.6905517578125, -364.73175048828125, -345.77294921875, -326.8141784667969, -307.85540771484375, -288.8966064453125, -269.93780517578125, -250.97903442382812, -232.02024841308594, -213.06146240234375, -194.10267639160156, -175.14389038085938, -156.1851043701172, -137.226318359375, -118.26753234863281, -99.30874633789062, -80.34996032714844, -61.39117431640625, -42.43238830566406, -23.473602294921875, -4.5148162841796875, 14.4439697265625, 33.40275573730469, 52.361541748046875, 71.32032775878906, 90.27911376953125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 1.0, 3.0, 4.0, 8.0, 18.0, 14.0, 19.0, 44.0, 67.0, 115.0, 155.0, 174.0, 145.0, 97.0, 44.0, 26.0, 19.0, 13.0, 7.0, 5.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.00408935546875, -52.73395919799805, -50.463829040527344, -48.19369888305664, -45.92356872558594, -43.653438568115234, -41.38330841064453, -39.11317443847656, -36.843048095703125, -34.57291793823242, -32.30278778076172, -30.032657623291016, -27.762527465820312, -25.49239730834961, -23.222265243530273, -20.95213508605957, -18.682003021240234, -16.41187286376953, -14.141742706298828, -11.871611595153809, -9.601481437683105, -7.331351280212402, -5.061220169067383, -2.7910900115966797, -0.5209598541259766, 1.7491705417633057, 4.019300937652588, 6.289431571960449, 8.559561729431152, 10.829691886901855, 13.099822998046875, 15.369953155517578, 17.64008331298828, 19.910213470458984, 22.180343627929688, 24.45047378540039, 26.720603942871094, 28.990734100341797, 31.260866165161133, 33.53099822998047, 35.801124572753906, 38.07125473022461, 40.34138488769531, 42.611515045166016, 44.88164520263672, 47.15177536010742, 49.421905517578125, 51.692039489746094, 53.9621696472168, 56.2322998046875, 58.5024299621582, 60.772560119628906, 63.04269027709961, 65.31282043457031, 67.58295440673828, 69.85308074951172, 72.12321472167969, 74.39334869384766, 76.6634750366211, 78.93360900878906, 81.2037353515625, 83.47386932373047, 85.7439956665039, 88.01412963867188, 90.28425598144531]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 1.0, 7.0, 5.0, 7.0, 6.0, 9.0, 17.0, 15.0, 15.0, 21.0, 32.0, 46.0, 66.0, 86.0, 142.0, 195.0, 372.0, 668.0, 1582.0, 4768.0, 34847.0, 4079890.0, 60618.0, 6004.0, 2121.0, 1128.0, 624.0, 375.0, 211.0, 130.0, 77.0, 55.0, 30.0, 22.0, 17.0, 19.0, 13.0, 8.0, 3.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57763671875, -0.5581130981445312, -0.5385894775390625, -0.5190658569335938, -0.499542236328125, -0.48001861572265625, -0.4604949951171875, -0.44097137451171875, -0.42144775390625, -0.40192413330078125, -0.3824005126953125, -0.36287689208984375, -0.343353271484375, -0.32382965087890625, -0.3043060302734375, -0.28478240966796875, -0.2652587890625, -0.24573516845703125, -0.2262115478515625, -0.20668792724609375, -0.187164306640625, -0.16764068603515625, -0.1481170654296875, -0.12859344482421875, -0.10906982421875, -0.08954620361328125, -0.0700225830078125, -0.05049896240234375, -0.030975341796875, -0.01145172119140625, 0.0080718994140625, 0.02759552001953125, 0.047119140625, 0.06664276123046875, 0.0861663818359375, 0.10569000244140625, 0.125213623046875, 0.14473724365234375, 0.1642608642578125, 0.18378448486328125, 0.20330810546875, 0.22283172607421875, 0.2423553466796875, 0.26187896728515625, 0.281402587890625, 0.30092620849609375, 0.3204498291015625, 0.33997344970703125, 0.3594970703125, 0.37902069091796875, 0.3985443115234375, 0.41806793212890625, 0.437591552734375, 0.45711517333984375, 0.4766387939453125, 0.49616241455078125, 0.51568603515625, 0.5352096557617188, 0.5547332763671875, 0.5742568969726562, 0.593780517578125, 0.6133041381835938, 0.6328277587890625, 0.6523513793945312, 0.671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 8.0, 5.0, 12.0, 40.0, 124.0, 274.0, 294.0, 126.0, 47.0, 19.0, 7.0, 5.0, 5.0, 4.0, 5.0, 8.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019439697265625, -0.01877117156982422, -0.018102645874023438, -0.017434120178222656, -0.016765594482421875, -0.016097068786621094, -0.015428543090820312, -0.014760017395019531, -0.01409149169921875, -0.013422966003417969, -0.012754440307617188, -0.012085914611816406, -0.011417388916015625, -0.010748863220214844, -0.010080337524414062, -0.009411811828613281, -0.0087432861328125, -0.008074760437011719, -0.0074062347412109375, -0.006737709045410156, -0.006069183349609375, -0.005400657653808594, -0.0047321319580078125, -0.004063606262207031, -0.00339508056640625, -0.0027265548706054688, -0.0020580291748046875, -0.0013895034790039062, -0.000720977783203125, -5.245208740234375e-05, 0.0006160736083984375, 0.0012845993041992188, 0.001953125, 0.0026216506958007812, 0.0032901763916015625, 0.003958702087402344, 0.004627227783203125, 0.005295753479003906, 0.0059642791748046875, 0.006632804870605469, 0.00730133056640625, 0.007969856262207031, 0.008638381958007812, 0.009306907653808594, 0.009975433349609375, 0.010643959045410156, 0.011312484741210938, 0.011981010437011719, 0.0126495361328125, 0.013318061828613281, 0.013986587524414062, 0.014655113220214844, 0.015323638916015625, 0.015992164611816406, 0.016660690307617188, 0.01732921600341797, 0.01799774169921875, 0.01866626739501953, 0.019334793090820312, 0.020003318786621094, 0.020671844482421875, 0.021340370178222656, 0.022008895874023438, 0.02267742156982422, 0.023345947265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 6.0, 11.0, 12.0, 19.0, 23.0, 53.0, 88.0, 167.0, 458.0, 1370.0, 6766.0, 272799.0, 3895394.0, 13635.0, 2104.0, 684.0, 264.0, 121.0, 73.0, 39.0, 36.0, 23.0, 18.0, 14.0, 25.0, 17.0, 10.0, 7.0, 6.0, 7.0, 5.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76123046875, -0.7309799194335938, -0.7007293701171875, -0.6704788208007812, -0.640228271484375, -0.6099777221679688, -0.5797271728515625, -0.5494766235351562, -0.51922607421875, -0.48897552490234375, -0.4587249755859375, -0.42847442626953125, -0.398223876953125, -0.36797332763671875, -0.3377227783203125, -0.30747222900390625, -0.2772216796875, -0.24697113037109375, -0.2167205810546875, -0.18647003173828125, -0.156219482421875, -0.12596893310546875, -0.0957183837890625, -0.06546783447265625, -0.03521728515625, -0.00496673583984375, 0.0252838134765625, 0.05553436279296875, 0.085784912109375, 0.11603546142578125, 0.1462860107421875, 0.17653656005859375, 0.206787109375, 0.23703765869140625, 0.2672882080078125, 0.29753875732421875, 0.327789306640625, 0.35803985595703125, 0.3882904052734375, 0.41854095458984375, 0.44879150390625, 0.47904205322265625, 0.5092926025390625, 0.5395431518554688, 0.569793701171875, 0.6000442504882812, 0.6302947998046875, 0.6605453491210938, 0.6907958984375, 0.7210464477539062, 0.7512969970703125, 0.7815475463867188, 0.811798095703125, 0.8420486450195312, 0.8722991943359375, 0.9025497436523438, 0.93280029296875, 0.9630508422851562, 0.9933013916015625, 1.0235519409179688, 1.053802490234375, 1.0840530395507812, 1.1143035888671875, 1.1445541381835938, 1.1748046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 7.0, 6.0, 13.0, 20.0, 18.0, 19.0, 15.0, 15.0, 35.0, 20.0, 52.0, 67.0, 91.0, 112.0, 167.0, 245.0, 417.0, 1185.0, 402.0, 328.0, 219.0, 180.0, 132.0, 78.0, 60.0, 42.0, 26.0, 22.0, 18.0, 12.0, 9.0, 8.0, 6.0, 3.0, 4.0, 2.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.045806884765625, -0.04447603225708008, -0.043145179748535156, -0.041814327239990234, -0.04048347473144531, -0.03915262222290039, -0.03782176971435547, -0.03649091720581055, -0.035160064697265625, -0.0338292121887207, -0.03249835968017578, -0.03116750717163086, -0.029836654663085938, -0.028505802154541016, -0.027174949645996094, -0.025844097137451172, -0.02451324462890625, -0.023182392120361328, -0.021851539611816406, -0.020520687103271484, -0.019189834594726562, -0.01785898208618164, -0.01652812957763672, -0.015197277069091797, -0.013866424560546875, -0.012535572052001953, -0.011204719543457031, -0.00987386703491211, -0.008543014526367188, -0.007212162017822266, -0.005881309509277344, -0.004550457000732422, -0.0032196044921875, -0.0018887519836425781, -0.0005578994750976562, 0.0007729530334472656, 0.0021038055419921875, 0.0034346580505371094, 0.004765510559082031, 0.006096363067626953, 0.007427215576171875, 0.008758068084716797, 0.010088920593261719, 0.01141977310180664, 0.012750625610351562, 0.014081478118896484, 0.015412330627441406, 0.016743183135986328, 0.01807403564453125, 0.019404888153076172, 0.020735740661621094, 0.022066593170166016, 0.023397445678710938, 0.02472829818725586, 0.02605915069580078, 0.027390003204345703, 0.028720855712890625, 0.030051708221435547, 0.03138256072998047, 0.03271341323852539, 0.03404426574707031, 0.035375118255615234, 0.036705970764160156, 0.03803682327270508, 0.03936767578125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 1.0, 28.0, 71.0, 305.0, 441.0, 124.0, 15.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9884470701217651, -1.931984305381775, -1.8755216598510742, -1.819058895111084, -1.7625961303710938, -1.7061333656311035, -1.6496707201004028, -1.5932079553604126, -1.536745309829712, -1.4802825450897217, -1.423819899559021, -1.3673571348190308, -1.3108943700790405, -1.2544317245483398, -1.1979689598083496, -1.1415061950683594, -1.0850434303283691, -1.028580665588379, -0.9721179604530334, -0.915655255317688, -0.8591924905776978, -0.8027297854423523, -0.7462670803070068, -0.6898043155670166, -0.6333416104316711, -0.5768789052963257, -0.5204161405563354, -0.46395343542099, -0.40749070048332214, -0.3510279655456543, -0.29456526041030884, -0.238102525472641, -0.1816396713256836, -0.12517693638801575, -0.0687142163515091, -0.012251496315002441, 0.044211238622665405, 0.10067397356033325, 0.1571366786956787, 0.21359941363334656, 0.2700621485710144, 0.32652488350868225, 0.3829876184463501, 0.43945032358169556, 0.4959130585193634, 0.5523757934570312, 0.6088384985923767, 0.6653012037277222, 0.7217639684677124, 0.7782266736030579, 0.8346894383430481, 0.8911521434783936, 0.9476149082183838, 1.004077672958374, 1.0605403184890747, 1.117003083229065, 1.1734657287597656, 1.2299284934997559, 1.2863911390304565, 1.3428539037704468, 1.399316668510437, 1.4557793140411377, 1.512242078781128, 1.5687048435211182, 1.6251676082611084]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 8.0, 10.0, 23.0, 25.0, 33.0, 42.0, 72.0, 91.0, 101.0, 104.0, 103.0, 74.0, 92.0, 77.0, 50.0, 36.0, 19.0, 14.0, 14.0, 12.0, 2.0, 3.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22400879859924316, -0.20970305800437927, -0.1953973025083542, -0.1810915619134903, -0.1667858213186264, -0.15248006582260132, -0.13817432522773743, -0.12386858463287354, -0.10956283658742905, -0.09525708854198456, -0.08095134794712067, -0.06664559990167618, -0.05233985558152199, -0.0380341112613678, -0.02372836321592331, -0.009422622621059418, 0.004883125424385071, 0.01918886974453926, 0.03349461406469345, 0.04780036211013794, 0.06210610643029213, 0.07641185075044632, 0.09071759879589081, 0.1050233393907547, 0.11932908743619919, 0.13363483548164368, 0.14794057607650757, 0.16224631667137146, 0.17655207216739655, 0.19085781276226044, 0.20516356825828552, 0.21946930885314941, 0.2337750494480133, 0.2480807900428772, 0.2623865306377411, 0.276692271232605, 0.29099804162979126, 0.30530378222465515, 0.31960952281951904, 0.33391526341438293, 0.3482210040092468, 0.3625267446041107, 0.3768324851989746, 0.3911382555961609, 0.4054439961910248, 0.41974973678588867, 0.43405547738075256, 0.44836121797561646, 0.46266698837280273, 0.4769727289676666, 0.4912784695625305, 0.5055842399597168, 0.5198899507522583, 0.5341957211494446, 0.5485014915466309, 0.5628072023391724, 0.5771129131317139, 0.5914186835289001, 0.6057243943214417, 0.6200301647186279, 0.6343358755111694, 0.6486416459083557, 0.662947416305542, 0.6772531270980835, 0.6915588974952698]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 2.0, 5.0, 4.0, 6.0, 10.0, 13.0, 11.0, 22.0, 36.0, 55.0, 78.0, 115.0, 249.0, 415.0, 862.0, 2362.0, 8865.0, 826277.0, 197687.0, 7572.0, 2171.0, 801.0, 366.0, 208.0, 109.0, 63.0, 57.0, 33.0, 24.0, 15.0, 13.0, 12.0, 9.0, 6.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4052734375, -1.3626251220703125, -1.319976806640625, -1.2773284912109375, -1.23468017578125, -1.1920318603515625, -1.149383544921875, -1.1067352294921875, -1.0640869140625, -1.0214385986328125, -0.978790283203125, -0.9361419677734375, -0.89349365234375, -0.8508453369140625, -0.808197021484375, -0.7655487060546875, -0.722900390625, -0.6802520751953125, -0.637603759765625, -0.5949554443359375, -0.55230712890625, -0.5096588134765625, -0.467010498046875, -0.4243621826171875, -0.3817138671875, -0.3390655517578125, -0.296417236328125, -0.2537689208984375, -0.21112060546875, -0.1684722900390625, -0.125823974609375, -0.0831756591796875, -0.04052734375, 0.0021209716796875, 0.044769287109375, 0.0874176025390625, 0.13006591796875, 0.1727142333984375, 0.215362548828125, 0.2580108642578125, 0.3006591796875, 0.3433074951171875, 0.385955810546875, 0.4286041259765625, 0.47125244140625, 0.5139007568359375, 0.556549072265625, 0.5991973876953125, 0.641845703125, 0.6844940185546875, 0.727142333984375, 0.7697906494140625, 0.81243896484375, 0.8550872802734375, 0.897735595703125, 0.9403839111328125, 0.9830322265625, 1.0256805419921875, 1.068328857421875, 1.1109771728515625, 1.15362548828125, 1.1962738037109375, 1.238922119140625, 1.2815704345703125, 1.32421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 6.0, 12.0, 5.0, 15.0, 25.0, 73.0, 167.0, 254.0, 214.0, 120.0, 50.0, 20.0, 9.0, 4.0, 7.0, 3.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01885986328125, -0.01820540428161621, -0.017550945281982422, -0.016896486282348633, -0.016242027282714844, -0.015587568283081055, -0.014933109283447266, -0.014278650283813477, -0.013624191284179688, -0.012969732284545898, -0.01231527328491211, -0.01166081428527832, -0.011006355285644531, -0.010351896286010742, -0.009697437286376953, -0.009042978286743164, -0.008388519287109375, -0.007734060287475586, -0.007079601287841797, -0.006425142288208008, -0.005770683288574219, -0.00511622428894043, -0.004461765289306641, -0.0038073062896728516, -0.0031528472900390625, -0.0024983882904052734, -0.0018439292907714844, -0.0011894702911376953, -0.0005350112915039062, 0.00011944770812988281, 0.0007739067077636719, 0.001428365707397461, 0.00208282470703125, 0.002737283706665039, 0.003391742706298828, 0.004046201705932617, 0.004700660705566406, 0.005355119705200195, 0.006009578704833984, 0.0066640377044677734, 0.0073184967041015625, 0.007972955703735352, 0.00862741470336914, 0.00928187370300293, 0.009936332702636719, 0.010590791702270508, 0.011245250701904297, 0.011899709701538086, 0.012554168701171875, 0.013208627700805664, 0.013863086700439453, 0.014517545700073242, 0.015172004699707031, 0.01582646369934082, 0.01648092269897461, 0.0171353816986084, 0.017789840698242188, 0.018444299697875977, 0.019098758697509766, 0.019753217697143555, 0.020407676696777344, 0.021062135696411133, 0.021716594696044922, 0.02237105369567871, 0.0230255126953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 7.0, 10.0, 11.0, 15.0, 21.0, 38.0, 35.0, 40.0, 63.0, 86.0, 111.0, 141.0, 240.0, 349.0, 596.0, 868.0, 1615.0, 3517.0, 9677.0, 34186.0, 259048.0, 667256.0, 48468.0, 12931.0, 4326.0, 1956.0, 1008.0, 587.0, 417.0, 259.0, 167.0, 126.0, 101.0, 72.0, 51.0, 30.0, 42.0, 17.0, 17.0, 16.0, 6.0, 4.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74169921875, -0.717864990234375, -0.69403076171875, -0.670196533203125, -0.6463623046875, -0.622528076171875, -0.59869384765625, -0.574859619140625, -0.551025390625, -0.527191162109375, -0.50335693359375, -0.479522705078125, -0.4556884765625, -0.431854248046875, -0.40802001953125, -0.384185791015625, -0.3603515625, -0.336517333984375, -0.31268310546875, -0.288848876953125, -0.2650146484375, -0.241180419921875, -0.21734619140625, -0.193511962890625, -0.169677734375, -0.145843505859375, -0.12200927734375, -0.098175048828125, -0.0743408203125, -0.050506591796875, -0.02667236328125, -0.002838134765625, 0.02099609375, 0.044830322265625, 0.06866455078125, 0.092498779296875, 0.1163330078125, 0.140167236328125, 0.16400146484375, 0.187835693359375, 0.211669921875, 0.235504150390625, 0.25933837890625, 0.283172607421875, 0.3070068359375, 0.330841064453125, 0.35467529296875, 0.378509521484375, 0.40234375, 0.426177978515625, 0.45001220703125, 0.473846435546875, 0.4976806640625, 0.521514892578125, 0.54534912109375, 0.569183349609375, 0.593017578125, 0.616851806640625, 0.64068603515625, 0.664520263671875, 0.6883544921875, 0.712188720703125, 0.73602294921875, 0.759857177734375, 0.78369140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 4.0, 8.0, 0.0, 14.0, 16.0, 15.0, 14.0, 18.0, 19.0, 33.0, 26.0, 42.0, 39.0, 27.0, 39.0, 35.0, 41.0, 41.0, 51.0, 44.0, 55.0, 46.0, 36.0, 36.0, 39.0, 35.0, 42.0, 26.0, 24.0, 23.0, 26.0, 19.0, 17.0, 8.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.07110595703125, -0.06909656524658203, -0.06708717346191406, -0.0650777816772461, -0.06306838989257812, -0.061058998107910156, -0.05904960632324219, -0.05704021453857422, -0.05503082275390625, -0.05302143096923828, -0.05101203918457031, -0.049002647399902344, -0.046993255615234375, -0.044983863830566406, -0.04297447204589844, -0.04096508026123047, -0.0389556884765625, -0.03694629669189453, -0.03493690490722656, -0.032927513122558594, -0.030918121337890625, -0.028908729553222656, -0.026899337768554688, -0.02488994598388672, -0.02288055419921875, -0.02087116241455078, -0.018861770629882812, -0.016852378845214844, -0.014842987060546875, -0.012833595275878906, -0.010824203491210938, -0.008814811706542969, -0.006805419921875, -0.004796028137207031, -0.0027866363525390625, -0.0007772445678710938, 0.001232147216796875, 0.0032415390014648438, 0.0052509307861328125, 0.007260322570800781, 0.00926971435546875, 0.011279106140136719, 0.013288497924804688, 0.015297889709472656, 0.017307281494140625, 0.019316673278808594, 0.021326065063476562, 0.02333545684814453, 0.0253448486328125, 0.02735424041748047, 0.029363632202148438, 0.031373023986816406, 0.033382415771484375, 0.035391807556152344, 0.03740119934082031, 0.03941059112548828, 0.04141998291015625, 0.04342937469482422, 0.04543876647949219, 0.047448158264160156, 0.049457550048828125, 0.051466941833496094, 0.05347633361816406, 0.05548572540283203, 0.0574951171875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 6.0, 7.0, 10.0, 17.0, 21.0, 25.0, 28.0, 43.0, 72.0, 120.0, 182.0, 332.0, 573.0, 1133.0, 3139.0, 11685.0, 132588.0, 867576.0, 22803.0, 4792.0, 1614.0, 751.0, 351.0, 241.0, 145.0, 84.0, 62.0, 43.0, 31.0, 20.0, 12.0, 14.0, 8.0, 4.0, 4.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.2578125, -3.162506103515625, -3.06719970703125, -2.971893310546875, -2.8765869140625, -2.781280517578125, -2.68597412109375, -2.590667724609375, -2.495361328125, -2.400054931640625, -2.30474853515625, -2.209442138671875, -2.1141357421875, -2.018829345703125, -1.92352294921875, -1.828216552734375, -1.73291015625, -1.637603759765625, -1.54229736328125, -1.446990966796875, -1.3516845703125, -1.256378173828125, -1.16107177734375, -1.065765380859375, -0.970458984375, -0.875152587890625, -0.77984619140625, -0.684539794921875, -0.5892333984375, -0.493927001953125, -0.39862060546875, -0.303314208984375, -0.2080078125, -0.112701416015625, -0.01739501953125, 0.077911376953125, 0.1732177734375, 0.268524169921875, 0.36383056640625, 0.459136962890625, 0.554443359375, 0.649749755859375, 0.74505615234375, 0.840362548828125, 0.9356689453125, 1.030975341796875, 1.12628173828125, 1.221588134765625, 1.31689453125, 1.412200927734375, 1.50750732421875, 1.602813720703125, 1.6981201171875, 1.793426513671875, 1.88873291015625, 1.984039306640625, 2.079345703125, 2.174652099609375, 2.26995849609375, 2.365264892578125, 2.4605712890625, 2.555877685546875, 2.65118408203125, 2.746490478515625, 2.841796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 6.0, 7.0, 7.0, 8.0, 7.0, 11.0, 23.0, 28.0, 26.0, 44.0, 81.0, 164.0, 292.0, 94.0, 43.0, 39.0, 23.0, 26.0, 19.0, 12.0, 12.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00018405914306640625, -0.00017911195755004883, -0.0001741647720336914, -0.00016921758651733398, -0.00016427040100097656, -0.00015932321548461914, -0.00015437602996826172, -0.0001494288444519043, -0.00014448165893554688, -0.00013953447341918945, -0.00013458728790283203, -0.0001296401023864746, -0.0001246929168701172, -0.00011974573135375977, -0.00011479854583740234, -0.00010985136032104492, -0.0001049041748046875, -9.995698928833008e-05, -9.500980377197266e-05, -9.006261825561523e-05, -8.511543273925781e-05, -8.016824722290039e-05, -7.522106170654297e-05, -7.027387619018555e-05, -6.532669067382812e-05, -6.03795051574707e-05, -5.543231964111328e-05, -5.048513412475586e-05, -4.553794860839844e-05, -4.0590763092041016e-05, -3.5643577575683594e-05, -3.069639205932617e-05, -2.574920654296875e-05, -2.0802021026611328e-05, -1.5854835510253906e-05, -1.0907649993896484e-05, -5.9604644775390625e-06, -1.0132789611816406e-06, 3.933906555175781e-06, 8.881092071533203e-06, 1.3828277587890625e-05, 1.8775463104248047e-05, 2.372264862060547e-05, 2.866983413696289e-05, 3.361701965332031e-05, 3.8564205169677734e-05, 4.3511390686035156e-05, 4.845857620239258e-05, 5.340576171875e-05, 5.835294723510742e-05, 6.330013275146484e-05, 6.824731826782227e-05, 7.319450378417969e-05, 7.814168930053711e-05, 8.308887481689453e-05, 8.803606033325195e-05, 9.298324584960938e-05, 9.79304313659668e-05, 0.00010287761688232422, 0.00010782480239868164, 0.00011277198791503906, 0.00011771917343139648, 0.0001226663589477539, 0.00012761354446411133, 0.00013256072998046875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 18.0, 26.0, 32.0, 82.0, 137.0, 225.0, 449.0, 1001.0, 2866.0, 16295.0, 992580.0, 28571.0, 3877.0, 1263.0, 514.0, 234.0, 140.0, 78.0, 48.0, 39.0, 18.0, 19.0, 3.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2999267578125, -5.146728515625, -4.9935302734375, -4.84033203125, -4.6871337890625, -4.533935546875, -4.3807373046875, -4.2275390625, -4.0743408203125, -3.921142578125, -3.7679443359375, -3.61474609375, -3.4615478515625, -3.308349609375, -3.1551513671875, -3.001953125, -2.8487548828125, -2.695556640625, -2.5423583984375, -2.38916015625, -2.2359619140625, -2.082763671875, -1.9295654296875, -1.7763671875, -1.6231689453125, -1.469970703125, -1.3167724609375, -1.16357421875, -1.0103759765625, -0.857177734375, -0.7039794921875, -0.55078125, -0.3975830078125, -0.244384765625, -0.0911865234375, 0.06201171875, 0.2152099609375, 0.368408203125, 0.5216064453125, 0.6748046875, 0.8280029296875, 0.981201171875, 1.1343994140625, 1.28759765625, 1.4407958984375, 1.593994140625, 1.7471923828125, 1.900390625, 2.0535888671875, 2.206787109375, 2.3599853515625, 2.51318359375, 2.6663818359375, 2.819580078125, 2.9727783203125, 3.1259765625, 3.2791748046875, 3.432373046875, 3.5855712890625, 3.73876953125, 3.8919677734375, 4.045166015625, 4.1983642578125, 4.3515625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 8.0, 19.0, 18.0, 43.0, 56.0, 64.0, 133.0, 219.0, 116.0, 83.0, 63.0, 37.0, 32.0, 24.0, 20.0, 12.0, 13.0, 7.0, 14.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0986328125, -1.06689453125, -1.03515625, -1.00341796875, -0.9716796875, -0.93994140625, -0.908203125, -0.87646484375, -0.8447265625, -0.81298828125, -0.78125, -0.74951171875, -0.7177734375, -0.68603515625, -0.654296875, -0.62255859375, -0.5908203125, -0.55908203125, -0.52734375, -0.49560546875, -0.4638671875, -0.43212890625, -0.400390625, -0.36865234375, -0.3369140625, -0.30517578125, -0.2734375, -0.24169921875, -0.2099609375, -0.17822265625, -0.146484375, -0.11474609375, -0.0830078125, -0.05126953125, -0.01953125, 0.01220703125, 0.0439453125, 0.07568359375, 0.107421875, 0.13916015625, 0.1708984375, 0.20263671875, 0.234375, 0.26611328125, 0.2978515625, 0.32958984375, 0.361328125, 0.39306640625, 0.4248046875, 0.45654296875, 0.48828125, 0.52001953125, 0.5517578125, 0.58349609375, 0.615234375, 0.64697265625, 0.6787109375, 0.71044921875, 0.7421875, 0.77392578125, 0.8056640625, 0.83740234375, 0.869140625, 0.90087890625, 0.9326171875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 10.0, 17.0, 38.0, 50.0, 113.0, 260.0, 383.0, 89.0, 25.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.10936737060547, -19.61117935180664, -19.112993240356445, -18.61480712890625, -18.116619110107422, -17.618431091308594, -17.1202449798584, -16.622058868408203, -16.123870849609375, -15.625683784484863, -15.127496719360352, -14.62930965423584, -14.131122589111328, -13.632935523986816, -13.134748458862305, -12.636561393737793, -12.138374328613281, -11.64018726348877, -11.142000198364258, -10.643813133239746, -10.145626068115234, -9.647439002990723, -9.149251937866211, -8.6510648727417, -8.152877807617188, -7.654690742492676, -7.156503677368164, -6.658316612243652, -6.160129547119141, -5.661942481994629, -5.163755416870117, -4.6655683517456055, -4.167380332946777, -3.6691932678222656, -3.171006202697754, -2.672819137573242, -2.1746320724487305, -1.6764450073242188, -1.178257942199707, -0.6800708770751953, -0.1818838119506836, 0.3163032531738281, 0.8144903182983398, 1.3126773834228516, 1.8108644485473633, 2.309051513671875, 2.8072385787963867, 3.3054256439208984, 3.80361270904541, 4.301799774169922, 4.799986839294434, 5.298173904418945, 5.796360969543457, 6.294548034667969, 6.7927350997924805, 7.290922164916992, 7.789109230041504, 8.287296295166016, 8.785483360290527, 9.283670425415039, 9.78185749053955, 10.280044555664062, 10.778231620788574, 11.276418685913086, 11.774605751037598]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 11.0, 14.0, 17.0, 19.0, 31.0, 41.0, 60.0, 66.0, 66.0, 86.0, 72.0, 80.0, 78.0, 84.0, 74.0, 53.0, 38.0, 33.0, 27.0, 12.0, 10.0, 10.0, 6.0, 10.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.461606025695801, -3.358848810195923, -3.256091594696045, -3.153334379196167, -3.050577163696289, -2.947819948196411, -2.845062732696533, -2.7423055171966553, -2.6395483016967773, -2.5367910861968994, -2.4340338706970215, -2.3312766551971436, -2.2285194396972656, -2.1257622241973877, -2.0230050086975098, -1.9202477931976318, -1.817490577697754, -1.714733362197876, -1.611976146697998, -1.5092189311981201, -1.4064617156982422, -1.3037045001983643, -1.2009472846984863, -1.0981900691986084, -0.9954328536987305, -0.8926756381988525, -0.7899184226989746, -0.6871612071990967, -0.5844039916992188, -0.4816467761993408, -0.3788895606994629, -0.27613234519958496, -0.17337489128112793, -0.07061767578125, 0.03213953971862793, 0.13489675521850586, 0.2376539707183838, 0.3404111862182617, 0.44316840171813965, 0.5459256172180176, 0.6486828327178955, 0.7514400482177734, 0.8541972637176514, 0.9569544792175293, 1.0597116947174072, 1.1624689102172852, 1.265226125717163, 1.367983341217041, 1.470740556716919, 1.5734977722167969, 1.6762549877166748, 1.7790122032165527, 1.8817694187164307, 1.9845266342163086, 2.0872838497161865, 2.1900410652160645, 2.2927982807159424, 2.3955554962158203, 2.4983127117156982, 2.601069927215576, 2.703827142715454, 2.806584358215332, 2.90934157371521, 3.012098789215088, 3.114856004714966]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 4.0, 11.0, 17.0, 24.0, 50.0, 161.0, 1329.0, 4139001.0, 52898.0, 587.0, 73.0, 34.0, 21.0, 17.0, 10.0, 9.0, 6.0, 3.0, 3.0, 6.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.6875, -25.899658203125, -25.11181640625, -24.323974609375, -23.5361328125, -22.748291015625, -21.96044921875, -21.172607421875, -20.384765625, -19.596923828125, -18.80908203125, -18.021240234375, -17.2333984375, -16.445556640625, -15.65771484375, -14.869873046875, -14.08203125, -13.294189453125, -12.50634765625, -11.718505859375, -10.9306640625, -10.142822265625, -9.35498046875, -8.567138671875, -7.779296875, -6.991455078125, -6.20361328125, -5.415771484375, -4.6279296875, -3.840087890625, -3.05224609375, -2.264404296875, -1.4765625, -0.688720703125, 0.09912109375, 0.886962890625, 1.6748046875, 2.462646484375, 3.25048828125, 4.038330078125, 4.826171875, 5.614013671875, 6.40185546875, 7.189697265625, 7.9775390625, 8.765380859375, 9.55322265625, 10.341064453125, 11.12890625, 11.916748046875, 12.70458984375, 13.492431640625, 14.2802734375, 15.068115234375, 15.85595703125, 16.643798828125, 17.431640625, 18.219482421875, 19.00732421875, 19.795166015625, 20.5830078125, 21.370849609375, 22.15869140625, 22.946533203125, 23.734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 4.0, 8.0, 11.0, 12.0, 10.0, 36.0, 56.0, 82.0, 103.0, 145.0, 134.0, 108.0, 94.0, 58.0, 46.0, 11.0, 11.0, 16.0, 5.0, 8.0, 3.0, 8.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038330078125, -0.03702497482299805, -0.035719871520996094, -0.03441476821899414, -0.03310966491699219, -0.031804561614990234, -0.03049945831298828, -0.029194355010986328, -0.027889251708984375, -0.026584148406982422, -0.02527904510498047, -0.023973941802978516, -0.022668838500976562, -0.02136373519897461, -0.020058631896972656, -0.018753528594970703, -0.01744842529296875, -0.016143321990966797, -0.014838218688964844, -0.01353311538696289, -0.012228012084960938, -0.010922908782958984, -0.009617805480957031, -0.008312702178955078, -0.007007598876953125, -0.005702495574951172, -0.004397392272949219, -0.0030922889709472656, -0.0017871856689453125, -0.0004820823669433594, 0.0008230209350585938, 0.002128124237060547, 0.0034332275390625, 0.004738330841064453, 0.006043434143066406, 0.007348537445068359, 0.008653640747070312, 0.009958744049072266, 0.011263847351074219, 0.012568950653076172, 0.013874053955078125, 0.015179157257080078, 0.01648426055908203, 0.017789363861083984, 0.019094467163085938, 0.02039957046508789, 0.021704673767089844, 0.023009777069091797, 0.02431488037109375, 0.025619983673095703, 0.026925086975097656, 0.02823019027709961, 0.029535293579101562, 0.030840396881103516, 0.03214550018310547, 0.03345060348510742, 0.034755706787109375, 0.03606081008911133, 0.03736591339111328, 0.038671016693115234, 0.03997611999511719, 0.04128122329711914, 0.042586326599121094, 0.04389142990112305, 0.045196533203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 15.0, 26.0, 54.0, 126.0, 290.0, 4404.0, 4171566.0, 16830.0, 568.0, 198.0, 114.0, 51.0, 26.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.03680419921875, -4.7337646484375, -4.43072509765625, -4.127685546875, -3.82464599609375, -3.5216064453125, -3.21856689453125, -2.91552734375, -2.61248779296875, -2.3094482421875, -2.00640869140625, -1.703369140625, -1.40032958984375, -1.0972900390625, -0.79425048828125, -0.4912109375, -0.18817138671875, 0.1148681640625, 0.41790771484375, 0.720947265625, 1.02398681640625, 1.3270263671875, 1.63006591796875, 1.93310546875, 2.23614501953125, 2.5391845703125, 2.84222412109375, 3.145263671875, 3.44830322265625, 3.7513427734375, 4.05438232421875, 4.357421875, 4.66046142578125, 4.9635009765625, 5.26654052734375, 5.569580078125, 5.87261962890625, 6.1756591796875, 6.47869873046875, 6.78173828125, 7.08477783203125, 7.3878173828125, 7.69085693359375, 7.993896484375, 8.29693603515625, 8.5999755859375, 8.90301513671875, 9.2060546875, 9.50909423828125, 9.8121337890625, 10.11517333984375, 10.418212890625, 10.72125244140625, 11.0242919921875, 11.32733154296875, 11.63037109375, 11.93341064453125, 12.2364501953125, 12.53948974609375, 12.842529296875, 13.14556884765625, 13.4486083984375, 13.75164794921875, 14.0546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 11.0, 7.0, 13.0, 14.0, 16.0, 20.0, 25.0, 41.0, 61.0, 107.0, 189.0, 392.0, 1756.0, 649.0, 292.0, 169.0, 85.0, 57.0, 31.0, 37.0, 17.0, 17.0, 9.0, 12.0, 4.0, 10.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1202392578125, -0.11618995666503906, -0.11214065551757812, -0.10809135437011719, -0.10404205322265625, -0.09999275207519531, -0.09594345092773438, -0.09189414978027344, -0.0878448486328125, -0.08379554748535156, -0.07974624633789062, -0.07569694519042969, -0.07164764404296875, -0.06759834289550781, -0.06354904174804688, -0.05949974060058594, -0.055450439453125, -0.05140113830566406, -0.047351837158203125, -0.04330253601074219, -0.03925323486328125, -0.03520393371582031, -0.031154632568359375, -0.027105331420898438, -0.0230560302734375, -0.019006729125976562, -0.014957427978515625, -0.010908126831054688, -0.00685882568359375, -0.0028095245361328125, 0.001239776611328125, 0.0052890777587890625, 0.00933837890625, 0.013387680053710938, 0.017436981201171875, 0.021486282348632812, 0.02553558349609375, 0.029584884643554688, 0.033634185791015625, 0.03768348693847656, 0.0417327880859375, 0.04578208923339844, 0.049831390380859375, 0.05388069152832031, 0.05792999267578125, 0.06197929382324219, 0.06602859497070312, 0.07007789611816406, 0.074127197265625, 0.07817649841308594, 0.08222579956054688, 0.08627510070800781, 0.09032440185546875, 0.09437370300292969, 0.09842300415039062, 0.10247230529785156, 0.1065216064453125, 0.11057090759277344, 0.11462020874023438, 0.11866950988769531, 0.12271881103515625, 0.1267681121826172, 0.13081741333007812, 0.13486671447753906, 0.138916015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 328.0, 671.0, 18.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7741808891296387, -2.0824437141418457, -1.3907063007354736, -0.6989688873291016, -0.007231712341308594, 0.6845054626464844, 1.3762431144714355, 2.0679802894592285, 2.7597174644470215, 3.4514546394348145, 4.143192291259766, 4.834929466247559, 5.526666641235352, 6.2184038162231445, 6.910141468048096, 7.601878643035889, 8.293615341186523, 8.985352516174316, 9.67708969116211, 10.368827819824219, 11.060564041137695, 11.752302169799805, 12.444039344787598, 13.13577651977539, 13.8275146484375, 14.519251823425293, 15.210988998413086, 15.902727127075195, 16.594463348388672, 17.28620147705078, 17.97793960571289, 18.669675827026367, 19.361412048339844, 20.053150177001953, 20.74488639831543, 21.43662452697754, 22.128360748291016, 22.820098876953125, 23.511837005615234, 24.20357322692871, 24.895309448242188, 25.587047576904297, 26.278783798217773, 26.970521926879883, 27.66225814819336, 28.35399627685547, 29.045734405517578, 29.737470626831055, 30.429208755493164, 31.120946884155273, 31.81268310546875, 32.50442123413086, 33.19615936279297, 33.88789367675781, 34.57963180541992, 35.27136993408203, 35.96310806274414, 36.65484619140625, 37.34658432006836, 38.0383186340332, 38.73005676269531, 39.42179489135742, 40.11353302001953, 40.805267333984375, 41.497005462646484]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 6.0, 9.0, 18.0, 33.0, 50.0, 79.0, 137.0, 162.0, 146.0, 130.0, 92.0, 64.0, 37.0, 27.0, 11.0, 5.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6058304309844971, -0.5424944758415222, -0.47915852069854736, -0.4158225953578949, -0.35248664021492004, -0.2891506850719452, -0.22581475973129272, -0.16247880458831787, -0.09914284944534302, -0.03580690175294876, 0.027529045939445496, 0.09086498618125916, 0.154200941324234, 0.21753689646720886, 0.28087282180786133, 0.3442087769508362, 0.40754473209381104, 0.4708806872367859, 0.5342166423797607, 0.5975525379180908, 0.6608885526657104, 0.7242244482040405, 0.7875604033470154, 0.8508963584899902, 0.9142323136329651, 0.9775682687759399, 1.04090416431427, 1.1042401790618896, 1.1675760746002197, 1.2309120893478394, 1.2942479848861694, 1.357583999633789, 1.4209198951721191, 1.4842557907104492, 1.5475918054580688, 1.610927700996399, 1.6742637157440186, 1.7375996112823486, 1.8009355068206787, 1.8642715215682983, 1.927607536315918, 1.990943431854248, 2.054279327392578, 2.1176154613494873, 2.1809513568878174, 2.2442872524261475, 2.3076231479644775, 2.3709592819213867, 2.434295177459717, 2.497631072998047, 2.560966968536377, 2.624303102493286, 2.687638998031616, 2.7509748935699463, 2.8143107891082764, 2.8776469230651855, 2.9409825801849365, 3.0043184757232666, 3.0676543712615967, 3.130990505218506, 3.194326400756836, 3.257662296295166, 3.320998191833496, 3.384334087371826, 3.4476702213287354]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 8.0, 11.0, 7.0, 10.0, 13.0, 17.0, 22.0, 24.0, 46.0, 41.0, 68.0, 105.0, 162.0, 355.0, 608.0, 1363.0, 4004.0, 20563.0, 718051.0, 284294.0, 13247.0, 3107.0, 1171.0, 497.0, 241.0, 148.0, 98.0, 65.0, 41.0, 43.0, 29.0, 24.0, 15.0, 11.0, 10.0, 7.0, 5.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.234375, -2.15704345703125, -2.0797119140625, -2.00238037109375, -1.925048828125, -1.84771728515625, -1.7703857421875, -1.69305419921875, -1.61572265625, -1.53839111328125, -1.4610595703125, -1.38372802734375, -1.306396484375, -1.22906494140625, -1.1517333984375, -1.07440185546875, -0.9970703125, -0.91973876953125, -0.8424072265625, -0.76507568359375, -0.687744140625, -0.61041259765625, -0.5330810546875, -0.45574951171875, -0.37841796875, -0.30108642578125, -0.2237548828125, -0.14642333984375, -0.069091796875, 0.00823974609375, 0.0855712890625, 0.16290283203125, 0.240234375, 0.31756591796875, 0.3948974609375, 0.47222900390625, 0.549560546875, 0.62689208984375, 0.7042236328125, 0.78155517578125, 0.85888671875, 0.93621826171875, 1.0135498046875, 1.09088134765625, 1.168212890625, 1.24554443359375, 1.3228759765625, 1.40020751953125, 1.4775390625, 1.55487060546875, 1.6322021484375, 1.70953369140625, 1.786865234375, 1.86419677734375, 1.9415283203125, 2.01885986328125, 2.09619140625, 2.17352294921875, 2.2508544921875, 2.32818603515625, 2.405517578125, 2.48284912109375, 2.5601806640625, 2.63751220703125, 2.71484375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 10.0, 16.0, 73.0, 141.0, 241.0, 236.0, 156.0, 77.0, 33.0, 15.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0270233154296875, -0.023736238479614258, -0.020449161529541016, -0.017162084579467773, -0.013875007629394531, -0.010587930679321289, -0.007300853729248047, -0.004013776779174805, -0.0007266998291015625, 0.0025603771209716797, 0.005847454071044922, 0.009134531021118164, 0.012421607971191406, 0.01570868492126465, 0.01899576187133789, 0.022282838821411133, 0.025569915771484375, 0.028856992721557617, 0.03214406967163086, 0.0354311466217041, 0.038718223571777344, 0.042005300521850586, 0.04529237747192383, 0.04857945442199707, 0.05186653137207031, 0.055153608322143555, 0.0584406852722168, 0.06172776222229004, 0.06501483917236328, 0.06830191612243652, 0.07158899307250977, 0.07487607002258301, 0.07816314697265625, 0.08145022392272949, 0.08473730087280273, 0.08802437782287598, 0.09131145477294922, 0.09459853172302246, 0.0978856086730957, 0.10117268562316895, 0.10445976257324219, 0.10774683952331543, 0.11103391647338867, 0.11432099342346191, 0.11760807037353516, 0.1208951473236084, 0.12418222427368164, 0.12746930122375488, 0.13075637817382812, 0.13404345512390137, 0.1373305320739746, 0.14061760902404785, 0.1439046859741211, 0.14719176292419434, 0.15047883987426758, 0.15376591682434082, 0.15705299377441406, 0.1603400707244873, 0.16362714767456055, 0.1669142246246338, 0.17020130157470703, 0.17348837852478027, 0.17677545547485352, 0.18006253242492676, 0.183349609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 5.0, 6.0, 8.0, 7.0, 10.0, 18.0, 12.0, 15.0, 18.0, 17.0, 15.0, 33.0, 24.0, 39.0, 67.0, 169.0, 685.0, 6802.0, 821651.0, 214323.0, 3812.0, 447.0, 109.0, 41.0, 44.0, 27.0, 22.0, 24.0, 18.0, 9.0, 8.0, 12.0, 7.0, 10.0, 8.0, 6.0, 6.0, 2.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.013671875, -2.92205810546875, -2.8304443359375, -2.73883056640625, -2.647216796875, -2.55560302734375, -2.4639892578125, -2.37237548828125, -2.28076171875, -2.18914794921875, -2.0975341796875, -2.00592041015625, -1.914306640625, -1.82269287109375, -1.7310791015625, -1.63946533203125, -1.5478515625, -1.45623779296875, -1.3646240234375, -1.27301025390625, -1.181396484375, -1.08978271484375, -0.9981689453125, -0.90655517578125, -0.81494140625, -0.72332763671875, -0.6317138671875, -0.54010009765625, -0.448486328125, -0.35687255859375, -0.2652587890625, -0.17364501953125, -0.08203125, 0.00958251953125, 0.1011962890625, 0.19281005859375, 0.284423828125, 0.37603759765625, 0.4676513671875, 0.55926513671875, 0.65087890625, 0.74249267578125, 0.8341064453125, 0.92572021484375, 1.017333984375, 1.10894775390625, 1.2005615234375, 1.29217529296875, 1.3837890625, 1.47540283203125, 1.5670166015625, 1.65863037109375, 1.750244140625, 1.84185791015625, 1.9334716796875, 2.02508544921875, 2.11669921875, 2.20831298828125, 2.2999267578125, 2.39154052734375, 2.483154296875, 2.57476806640625, 2.6663818359375, 2.75799560546875, 2.849609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 4.0, 6.0, 14.0, 8.0, 8.0, 16.0, 31.0, 26.0, 25.0, 45.0, 45.0, 58.0, 55.0, 58.0, 65.0, 47.0, 57.0, 53.0, 52.0, 49.0, 58.0, 46.0, 36.0, 28.0, 27.0, 21.0, 15.0, 12.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166748046875, -0.16125869750976562, -0.15576934814453125, -0.15027999877929688, -0.1447906494140625, -0.13930130004882812, -0.13381195068359375, -0.12832260131835938, -0.122833251953125, -0.11734390258789062, -0.11185455322265625, -0.10636520385742188, -0.1008758544921875, -0.09538650512695312, -0.08989715576171875, -0.08440780639648438, -0.07891845703125, -0.07342910766601562, -0.06793975830078125, -0.062450408935546875, -0.0569610595703125, -0.051471710205078125, -0.04598236083984375, -0.040493011474609375, -0.035003662109375, -0.029514312744140625, -0.02402496337890625, -0.018535614013671875, -0.0130462646484375, -0.007556915283203125, -0.00206756591796875, 0.003421783447265625, 0.0089111328125, 0.014400482177734375, 0.01988983154296875, 0.025379180908203125, 0.0308685302734375, 0.036357879638671875, 0.04184722900390625, 0.047336578369140625, 0.052825927734375, 0.058315277099609375, 0.06380462646484375, 0.06929397583007812, 0.0747833251953125, 0.08027267456054688, 0.08576202392578125, 0.09125137329101562, 0.09674072265625, 0.10223007202148438, 0.10771942138671875, 0.11320877075195312, 0.1186981201171875, 0.12418746948242188, 0.12967681884765625, 0.13516616821289062, 0.140655517578125, 0.14614486694335938, 0.15163421630859375, 0.15712356567382812, 0.1626129150390625, 0.16810226440429688, 0.17359161376953125, 0.17908096313476562, 0.1845703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 14.0, 18.0, 60.0, 351.0, 16218.0, 1030879.0, 851.0, 90.0, 25.0, 15.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.921875, -25.30712890625, -24.6923828125, -24.07763671875, -23.462890625, -22.84814453125, -22.2333984375, -21.61865234375, -21.00390625, -20.38916015625, -19.7744140625, -19.15966796875, -18.544921875, -17.93017578125, -17.3154296875, -16.70068359375, -16.0859375, -15.47119140625, -14.8564453125, -14.24169921875, -13.626953125, -13.01220703125, -12.3974609375, -11.78271484375, -11.16796875, -10.55322265625, -9.9384765625, -9.32373046875, -8.708984375, -8.09423828125, -7.4794921875, -6.86474609375, -6.25, -5.63525390625, -5.0205078125, -4.40576171875, -3.791015625, -3.17626953125, -2.5615234375, -1.94677734375, -1.33203125, -0.71728515625, -0.1025390625, 0.51220703125, 1.126953125, 1.74169921875, 2.3564453125, 2.97119140625, 3.5859375, 4.20068359375, 4.8154296875, 5.43017578125, 6.044921875, 6.65966796875, 7.2744140625, 7.88916015625, 8.50390625, 9.11865234375, 9.7333984375, 10.34814453125, 10.962890625, 11.57763671875, 12.1923828125, 12.80712890625, 13.421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 9.0, 13.0, 21.0, 29.0, 61.0, 189.0, 455.0, 111.0, 31.0, 16.0, 19.0, 9.0, 9.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000213623046875, -0.0002067945897579193, -0.00019996613264083862, -0.00019313767552375793, -0.00018630921840667725, -0.00017948076128959656, -0.00017265230417251587, -0.00016582384705543518, -0.0001589953899383545, -0.0001521669328212738, -0.00014533847570419312, -0.00013851001858711243, -0.00013168156147003174, -0.00012485310435295105, -0.00011802464723587036, -0.00011119619011878967, -0.00010436773300170898, -9.75392758846283e-05, -9.071081876754761e-05, -8.388236165046692e-05, -7.705390453338623e-05, -7.022544741630554e-05, -6.339699029922485e-05, -5.6568533182144165e-05, -4.9740076065063477e-05, -4.291161894798279e-05, -3.60831618309021e-05, -2.925470471382141e-05, -2.2426247596740723e-05, -1.5597790479660034e-05, -8.769333362579346e-06, -1.9408762454986572e-06, 4.887580871582031e-06, 1.171603798866272e-05, 1.8544495105743408e-05, 2.5372952222824097e-05, 3.2201409339904785e-05, 3.9029866456985474e-05, 4.585832357406616e-05, 5.268678069114685e-05, 5.951523780822754e-05, 6.634369492530823e-05, 7.317215204238892e-05, 8.00006091594696e-05, 8.682906627655029e-05, 9.365752339363098e-05, 0.00010048598051071167, 0.00010731443762779236, 0.00011414289474487305, 0.00012097135186195374, 0.00012779980897903442, 0.0001346282660961151, 0.0001414567232131958, 0.0001482851803302765, 0.00015511363744735718, 0.00016194209456443787, 0.00016877055168151855, 0.00017559900879859924, 0.00018242746591567993, 0.00018925592303276062, 0.0001960843801498413, 0.000202912837266922, 0.00020974129438400269, 0.00021656975150108337, 0.00022339820861816406]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 5.0, 20.0, 41.0, 149.0, 1378.0, 860510.0, 184777.0, 1380.0, 172.0, 50.0, 22.0, 11.0, 5.0, 7.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0546875, -4.852294921875, -4.64990234375, -4.447509765625, -4.2451171875, -4.042724609375, -3.84033203125, -3.637939453125, -3.435546875, -3.233154296875, -3.03076171875, -2.828369140625, -2.6259765625, -2.423583984375, -2.22119140625, -2.018798828125, -1.81640625, -1.614013671875, -1.41162109375, -1.209228515625, -1.0068359375, -0.804443359375, -0.60205078125, -0.399658203125, -0.197265625, 0.005126953125, 0.20751953125, 0.409912109375, 0.6123046875, 0.814697265625, 1.01708984375, 1.219482421875, 1.421875, 1.624267578125, 1.82666015625, 2.029052734375, 2.2314453125, 2.433837890625, 2.63623046875, 2.838623046875, 3.041015625, 3.243408203125, 3.44580078125, 3.648193359375, 3.8505859375, 4.052978515625, 4.25537109375, 4.457763671875, 4.66015625, 4.862548828125, 5.06494140625, 5.267333984375, 5.4697265625, 5.672119140625, 5.87451171875, 6.076904296875, 6.279296875, 6.481689453125, 6.68408203125, 6.886474609375, 7.0888671875, 7.291259765625, 7.49365234375, 7.696044921875, 7.8984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 5.0, 5.0, 7.0, 15.0, 20.0, 31.0, 38.0, 67.0, 290.0, 282.0, 81.0, 46.0, 35.0, 19.0, 15.0, 5.0, 6.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374755859375, -0.3584632873535156, -0.34217071533203125, -0.3258781433105469, -0.3095855712890625, -0.2932929992675781, -0.27700042724609375, -0.2607078552246094, -0.244415283203125, -0.22812271118164062, -0.21183013916015625, -0.19553756713867188, -0.1792449951171875, -0.16295242309570312, -0.14665985107421875, -0.13036727905273438, -0.11407470703125, -0.09778213500976562, -0.08148956298828125, -0.06519699096679688, -0.0489044189453125, -0.032611846923828125, -0.01631927490234375, -2.6702880859375e-05, 0.016265869140625, 0.032558441162109375, 0.04885101318359375, 0.06514358520507812, 0.0814361572265625, 0.09772872924804688, 0.11402130126953125, 0.13031387329101562, 0.1466064453125, 0.16289901733398438, 0.17919158935546875, 0.19548416137695312, 0.2117767333984375, 0.22806930541992188, 0.24436187744140625, 0.2606544494628906, 0.276947021484375, 0.2932395935058594, 0.30953216552734375, 0.3258247375488281, 0.3421173095703125, 0.3584098815917969, 0.37470245361328125, 0.3909950256347656, 0.40728759765625, 0.4235801696777344, 0.43987274169921875, 0.4561653137207031, 0.4724578857421875, 0.4887504577636719, 0.5050430297851562, 0.5213356018066406, 0.537628173828125, 0.5539207458496094, 0.5702133178710938, 0.5865058898925781, 0.6027984619140625, 0.6190910339355469, 0.6353836059570312, 0.6516761779785156, 0.66796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 36.0, 270.0, 553.0, 104.0, 24.0, 12.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.51958465576172, -20.094493865966797, -19.669403076171875, -19.244312286376953, -18.81922149658203, -18.394132614135742, -17.96904182434082, -17.5439510345459, -17.118860244750977, -16.693769454956055, -16.268678665161133, -15.843588829040527, -15.418498039245605, -14.993407249450684, -14.568317413330078, -14.143226623535156, -13.718135833740234, -13.293045043945312, -12.86795425415039, -12.442864418029785, -12.017773628234863, -11.592682838439941, -11.167593002319336, -10.742502212524414, -10.317411422729492, -9.89232063293457, -9.467229843139648, -9.042140007019043, -8.617049217224121, -8.1919584274292, -7.7668681144714355, -7.341777801513672, -6.916686534881592, -6.491596221923828, -6.066505432128906, -5.641414642333984, -5.216324329376221, -4.791234016418457, -4.366143226623535, -3.9410526752471924, -3.5159621238708496, -3.090871572494507, -2.665781021118164, -2.2406904697418213, -1.8155999183654785, -1.3905093669891357, -0.965418815612793, -0.5403282642364502, -0.11523771286010742, 0.30985283851623535, 0.7349433898925781, 1.160033941268921, 1.5851244926452637, 2.0102150440216064, 2.435305595397949, 2.860396146774292, 3.2854866981506348, 3.7105772495269775, 4.13566780090332, 4.560758590698242, 4.985848903656006, 5.4109392166137695, 5.836030006408691, 6.261120796203613, 6.686211109161377]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 8.0, 12.0, 20.0, 28.0, 43.0, 47.0, 74.0, 84.0, 90.0, 110.0, 90.0, 81.0, 90.0, 64.0, 43.0, 47.0, 19.0, 17.0, 14.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.528778553009033, -2.4614713191986084, -2.3941640853881836, -2.326857089996338, -2.259549856185913, -2.1922426223754883, -2.1249356269836426, -2.0576283931732178, -1.990321159362793, -1.9230139255523682, -1.855706810951233, -1.7883996963500977, -1.7210924625396729, -1.653785228729248, -1.5864781141281128, -1.5191709995269775, -1.4518637657165527, -1.384556531906128, -1.3172494173049927, -1.2499423027038574, -1.1826350688934326, -1.1153278350830078, -1.0480207204818726, -0.9807135462760925, -0.9134063720703125, -0.8460991978645325, -0.7787920236587524, -0.7114848494529724, -0.6441776752471924, -0.5768705010414124, -0.5095633268356323, -0.4422561526298523, -0.37494921684265137, -0.30764204263687134, -0.2403348684310913, -0.17302769422531128, -0.10572052001953125, -0.03841334581375122, 0.02889382839202881, 0.09620100259780884, 0.16350817680358887, 0.2308153510093689, 0.2981225252151489, 0.36542969942092896, 0.432736873626709, 0.500044047832489, 0.567351222038269, 0.6346583962440491, 0.7019655704498291, 0.7692727446556091, 0.8365799188613892, 0.9038870930671692, 0.9711942672729492, 1.038501501083374, 1.1058086156845093, 1.1731157302856445, 1.2404229640960693, 1.3077301979064941, 1.3750373125076294, 1.4423444271087646, 1.5096516609191895, 1.5769588947296143, 1.6442660093307495, 1.7115731239318848, 1.7788803577423096]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 8.0, 6.0, 4.0, 2.0, 12.0, 7.0, 26.0, 13.0, 24.0, 37.0, 82.0, 153.0, 343.0, 2331.0, 150423.0, 4032828.0, 6226.0, 942.0, 324.0, 139.0, 79.0, 65.0, 65.0, 36.0, 23.0, 18.0, 19.0, 13.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.62109375, -4.43719482421875, -4.2532958984375, -4.06939697265625, -3.885498046875, -3.70159912109375, -3.5177001953125, -3.33380126953125, -3.14990234375, -2.96600341796875, -2.7821044921875, -2.59820556640625, -2.414306640625, -2.23040771484375, -2.0465087890625, -1.86260986328125, -1.6787109375, -1.49481201171875, -1.3109130859375, -1.12701416015625, -0.943115234375, -0.75921630859375, -0.5753173828125, -0.39141845703125, -0.20751953125, -0.02362060546875, 0.1602783203125, 0.34417724609375, 0.528076171875, 0.71197509765625, 0.8958740234375, 1.07977294921875, 1.263671875, 1.44757080078125, 1.6314697265625, 1.81536865234375, 1.999267578125, 2.18316650390625, 2.3670654296875, 2.55096435546875, 2.73486328125, 2.91876220703125, 3.1026611328125, 3.28656005859375, 3.470458984375, 3.65435791015625, 3.8382568359375, 4.02215576171875, 4.2060546875, 4.38995361328125, 4.5738525390625, 4.75775146484375, 4.941650390625, 5.12554931640625, 5.3094482421875, 5.49334716796875, 5.67724609375, 5.86114501953125, 6.0450439453125, 6.22894287109375, 6.412841796875, 6.59674072265625, 6.7806396484375, 6.96453857421875, 7.1484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 12.0, 12.0, 39.0, 66.0, 106.0, 166.0, 175.0, 175.0, 116.0, 64.0, 33.0, 17.0, 12.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03741455078125, -0.03467845916748047, -0.03194236755371094, -0.029206275939941406, -0.026470184326171875, -0.023734092712402344, -0.020998001098632812, -0.01826190948486328, -0.01552581787109375, -0.012789726257324219, -0.010053634643554688, -0.007317543029785156, -0.004581451416015625, -0.0018453598022460938, 0.0008907318115234375, 0.0036268234252929688, 0.0063629150390625, 0.009099006652832031, 0.011835098266601562, 0.014571189880371094, 0.017307281494140625, 0.020043373107910156, 0.022779464721679688, 0.02551555633544922, 0.02825164794921875, 0.03098773956298828, 0.03372383117675781, 0.036459922790527344, 0.039196014404296875, 0.041932106018066406, 0.04466819763183594, 0.04740428924560547, 0.050140380859375, 0.05287647247314453, 0.05561256408691406, 0.058348655700683594, 0.061084747314453125, 0.06382083892822266, 0.06655693054199219, 0.06929302215576172, 0.07202911376953125, 0.07476520538330078, 0.07750129699707031, 0.08023738861083984, 0.08297348022460938, 0.0857095718383789, 0.08844566345214844, 0.09118175506591797, 0.0939178466796875, 0.09665393829345703, 0.09939002990722656, 0.1021261215209961, 0.10486221313476562, 0.10759830474853516, 0.11033439636230469, 0.11307048797607422, 0.11580657958984375, 0.11854267120361328, 0.12127876281738281, 0.12401485443115234, 0.12675094604492188, 0.1294870376586914, 0.13222312927246094, 0.13495922088623047, 0.1376953125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 9.0, 8.0, 25.0, 46.0, 54.0, 88.0, 132.0, 186.0, 310.0, 690.0, 24587.0, 4161754.0, 5041.0, 471.0, 276.0, 186.0, 129.0, 86.0, 67.0, 33.0, 28.0, 26.0, 22.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1171875, -10.811279296875, -10.50537109375, -10.199462890625, -9.8935546875, -9.587646484375, -9.28173828125, -8.975830078125, -8.669921875, -8.364013671875, -8.05810546875, -7.752197265625, -7.4462890625, -7.140380859375, -6.83447265625, -6.528564453125, -6.22265625, -5.916748046875, -5.61083984375, -5.304931640625, -4.9990234375, -4.693115234375, -4.38720703125, -4.081298828125, -3.775390625, -3.469482421875, -3.16357421875, -2.857666015625, -2.5517578125, -2.245849609375, -1.93994140625, -1.634033203125, -1.328125, -1.022216796875, -0.71630859375, -0.410400390625, -0.1044921875, 0.201416015625, 0.50732421875, 0.813232421875, 1.119140625, 1.425048828125, 1.73095703125, 2.036865234375, 2.3427734375, 2.648681640625, 2.95458984375, 3.260498046875, 3.56640625, 3.872314453125, 4.17822265625, 4.484130859375, 4.7900390625, 5.095947265625, 5.40185546875, 5.707763671875, 6.013671875, 6.319580078125, 6.62548828125, 6.931396484375, 7.2373046875, 7.543212890625, 7.84912109375, 8.155029296875, 8.4609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 10.0, 19.0, 29.0, 64.0, 82.0, 297.0, 3117.0, 286.0, 87.0, 31.0, 26.0, 18.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1602783203125, -0.14630699157714844, -0.13233566284179688, -0.11836433410644531, -0.10439300537109375, -0.09042167663574219, -0.07645034790039062, -0.06247901916503906, -0.0485076904296875, -0.03453636169433594, -0.020565032958984375, -0.0065937042236328125, 0.00737762451171875, 0.021348953247070312, 0.035320281982421875, 0.04929161071777344, 0.063262939453125, 0.07723426818847656, 0.09120559692382812, 0.10517692565917969, 0.11914825439453125, 0.1331195831298828, 0.14709091186523438, 0.16106224060058594, 0.1750335693359375, 0.18900489807128906, 0.20297622680664062, 0.2169475555419922, 0.23091888427734375, 0.2448902130126953, 0.2588615417480469, 0.27283287048339844, 0.28680419921875, 0.30077552795410156, 0.3147468566894531, 0.3287181854248047, 0.34268951416015625, 0.3566608428955078, 0.3706321716308594, 0.38460350036621094, 0.3985748291015625, 0.41254615783691406, 0.4265174865722656, 0.4404888153076172, 0.45446014404296875, 0.4684314727783203, 0.4824028015136719, 0.49637413024902344, 0.510345458984375, 0.5243167877197266, 0.5382881164550781, 0.5522594451904297, 0.5662307739257812, 0.5802021026611328, 0.5941734313964844, 0.6081447601318359, 0.6221160888671875, 0.6360874176025391, 0.6500587463378906, 0.6640300750732422, 0.6780014038085938, 0.6919727325439453, 0.7059440612792969, 0.7199153900146484, 0.73388671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 13.0, 41.0, 150.0, 623.0, 143.0, 25.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.153366088867188, -26.59396743774414, -26.034568786621094, -25.475170135498047, -24.915771484375, -24.35637092590332, -23.796972274780273, -23.237573623657227, -22.67817497253418, -22.118776321411133, -21.559377670288086, -20.99997901916504, -20.44057846069336, -19.881179809570312, -19.321781158447266, -18.76238250732422, -18.202983856201172, -17.643585205078125, -17.084186553955078, -16.52478790283203, -15.965388298034668, -15.405989646911621, -14.846590042114258, -14.287191390991211, -13.727792739868164, -13.168394088745117, -12.60899543762207, -12.049595832824707, -11.49019718170166, -10.930798530578613, -10.37139892578125, -9.812000274658203, -9.252603530883789, -8.693204879760742, -8.133806228637695, -7.574406623840332, -7.015007972717285, -6.455609321594238, -5.896210193634033, -5.336811065673828, -4.777412414550781, -4.218013763427734, -3.6586146354675293, -3.0992157459259033, -2.5398168563842773, -1.9804179668426514, -1.4210190773010254, -0.8616201877593994, -0.30222129821777344, 0.25717759132385254, 0.8165764808654785, 1.3759753704071045, 1.9353742599487305, 2.4947731494903564, 3.0541720390319824, 3.6135709285736084, 4.172969818115234, 4.732368469238281, 5.291767597198486, 5.851166725158691, 6.410565376281738, 6.969964027404785, 7.52936315536499, 8.088762283325195, 8.648160934448242]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 11.0, 16.0, 49.0, 103.0, 199.0, 258.0, 184.0, 122.0, 40.0, 24.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.749866008758545, -2.468902111053467, -2.1879382133483887, -1.9069744348526, -1.626010537147522, -1.3450466394424438, -1.0640828609466553, -0.7831189632415771, -0.502155065536499, -0.2211911976337433, 0.05977267026901245, 0.3407365083694458, 0.6217004060745239, 0.902664303779602, 1.1836280822753906, 1.4645919799804688, 1.7455558776855469, 2.026519775390625, 2.307483673095703, 2.5884475708007812, 2.8694114685058594, 3.1503753662109375, 3.4313390254974365, 3.7123029232025146, 3.9932668209075928, 4.274230480194092, 4.55519437789917, 4.836158275604248, 5.117122173309326, 5.398086071014404, 5.679049968719482, 5.9600138664245605, 6.240978240966797, 6.521942138671875, 6.802906036376953, 7.083869934082031, 7.364833831787109, 7.6457977294921875, 7.926761627197266, 8.207725524902344, 8.488689422607422, 8.7696533203125, 9.050617218017578, 9.331581115722656, 9.612545013427734, 9.893508911132812, 10.17447280883789, 10.455436706542969, 10.736400604248047, 11.017364501953125, 11.298328399658203, 11.579292297363281, 11.86025619506836, 12.141220092773438, 12.422183990478516, 12.703147888183594, 12.984110832214355, 13.265074729919434, 13.546038627624512, 13.82700252532959, 14.107966423034668, 14.388930320739746, 14.669894218444824, 14.950858116149902, 15.23182201385498]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 13.0, 9.0, 18.0, 13.0, 15.0, 17.0, 27.0, 21.0, 37.0, 28.0, 37.0, 32.0, 41.0, 50.0, 99.0, 1232.0, 1036965.0, 9304.0, 147.0, 73.0, 43.0, 51.0, 40.0, 32.0, 29.0, 29.0, 20.0, 35.0, 15.0, 9.0, 8.0, 8.0, 10.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-42.34375, -41.1220703125, -39.900390625, -38.6787109375, -37.45703125, -36.2353515625, -35.013671875, -33.7919921875, -32.5703125, -31.3486328125, -30.126953125, -28.9052734375, -27.68359375, -26.4619140625, -25.240234375, -24.0185546875, -22.796875, -21.5751953125, -20.353515625, -19.1318359375, -17.91015625, -16.6884765625, -15.466796875, -14.2451171875, -13.0234375, -11.8017578125, -10.580078125, -9.3583984375, -8.13671875, -6.9150390625, -5.693359375, -4.4716796875, -3.25, -2.0283203125, -0.806640625, 0.4150390625, 1.63671875, 2.8583984375, 4.080078125, 5.3017578125, 6.5234375, 7.7451171875, 8.966796875, 10.1884765625, 11.41015625, 12.6318359375, 13.853515625, 15.0751953125, 16.296875, 17.5185546875, 18.740234375, 19.9619140625, 21.18359375, 22.4052734375, 23.626953125, 24.8486328125, 26.0703125, 27.2919921875, 28.513671875, 29.7353515625, 30.95703125, 32.1787109375, 33.400390625, 34.6220703125, 35.84375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 18.0, 184.0, 578.0, 215.0, 14.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4326171875, -0.3667755126953125, -0.300933837890625, -0.2350921630859375, -0.16925048828125, -0.1034088134765625, -0.037567138671875, 0.0282745361328125, 0.0941162109375, 0.1599578857421875, 0.225799560546875, 0.2916412353515625, 0.35748291015625, 0.4233245849609375, 0.489166259765625, 0.5550079345703125, 0.620849609375, 0.6866912841796875, 0.752532958984375, 0.8183746337890625, 0.88421630859375, 0.9500579833984375, 1.015899658203125, 1.0817413330078125, 1.1475830078125, 1.2134246826171875, 1.279266357421875, 1.3451080322265625, 1.41094970703125, 1.4767913818359375, 1.542633056640625, 1.6084747314453125, 1.67431640625, 1.7401580810546875, 1.805999755859375, 1.8718414306640625, 1.93768310546875, 2.0035247802734375, 2.069366455078125, 2.1352081298828125, 2.2010498046875, 2.2668914794921875, 2.332733154296875, 2.3985748291015625, 2.46441650390625, 2.5302581787109375, 2.596099853515625, 2.6619415283203125, 2.727783203125, 2.7936248779296875, 2.859466552734375, 2.9253082275390625, 2.99114990234375, 3.0569915771484375, 3.122833251953125, 3.1886749267578125, 3.2545166015625, 3.3203582763671875, 3.386199951171875, 3.4520416259765625, 3.51788330078125, 3.5837249755859375, 3.649566650390625, 3.7154083251953125, 3.78125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 9.0, 19.0, 23.0, 33.0, 43.0, 59.0, 81.0, 114.0, 188.0, 322.0, 497.0, 891.0, 1584.0, 3227.0, 7100.0, 18678.0, 62578.0, 299682.0, 496998.0, 108697.0, 28425.0, 10159.0, 4280.0, 2064.0, 1141.0, 595.0, 351.0, 220.0, 178.0, 85.0, 84.0, 50.0, 25.0, 17.0, 18.0, 10.0, 10.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.875, -7.6141357421875, -7.353271484375, -7.0924072265625, -6.83154296875, -6.5706787109375, -6.309814453125, -6.0489501953125, -5.7880859375, -5.5272216796875, -5.266357421875, -5.0054931640625, -4.74462890625, -4.4837646484375, -4.222900390625, -3.9620361328125, -3.701171875, -3.4403076171875, -3.179443359375, -2.9185791015625, -2.65771484375, -2.3968505859375, -2.135986328125, -1.8751220703125, -1.6142578125, -1.3533935546875, -1.092529296875, -0.8316650390625, -0.57080078125, -0.3099365234375, -0.049072265625, 0.2117919921875, 0.47265625, 0.7335205078125, 0.994384765625, 1.2552490234375, 1.51611328125, 1.7769775390625, 2.037841796875, 2.2987060546875, 2.5595703125, 2.8204345703125, 3.081298828125, 3.3421630859375, 3.60302734375, 3.8638916015625, 4.124755859375, 4.3856201171875, 4.646484375, 4.9073486328125, 5.168212890625, 5.4290771484375, 5.68994140625, 5.9508056640625, 6.211669921875, 6.4725341796875, 6.7333984375, 6.9942626953125, 7.255126953125, 7.5159912109375, 7.77685546875, 8.0377197265625, 8.298583984375, 8.5594482421875, 8.8203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 13.0, 8.0, 14.0, 17.0, 13.0, 25.0, 31.0, 35.0, 38.0, 43.0, 49.0, 47.0, 49.0, 65.0, 64.0, 63.0, 59.0, 55.0, 39.0, 43.0, 39.0, 39.0, 23.0, 21.0, 23.0, 14.0, 14.0, 10.0, 11.0, 5.0, 5.0, 6.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.40625, -3.307586669921875, -3.20892333984375, -3.110260009765625, -3.0115966796875, -2.912933349609375, -2.81427001953125, -2.715606689453125, -2.616943359375, -2.518280029296875, -2.41961669921875, -2.320953369140625, -2.2222900390625, -2.123626708984375, -2.02496337890625, -1.926300048828125, -1.82763671875, -1.728973388671875, -1.63031005859375, -1.531646728515625, -1.4329833984375, -1.334320068359375, -1.23565673828125, -1.136993408203125, -1.038330078125, -0.939666748046875, -0.84100341796875, -0.742340087890625, -0.6436767578125, -0.545013427734375, -0.44635009765625, -0.347686767578125, -0.2490234375, -0.150360107421875, -0.05169677734375, 0.046966552734375, 0.1456298828125, 0.244293212890625, 0.34295654296875, 0.441619873046875, 0.540283203125, 0.638946533203125, 0.73760986328125, 0.836273193359375, 0.9349365234375, 1.033599853515625, 1.13226318359375, 1.230926513671875, 1.32958984375, 1.428253173828125, 1.52691650390625, 1.625579833984375, 1.7242431640625, 1.822906494140625, 1.92156982421875, 2.020233154296875, 2.118896484375, 2.217559814453125, 2.31622314453125, 2.414886474609375, 2.5135498046875, 2.612213134765625, 2.71087646484375, 2.809539794921875, 2.908203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 7.0, 9.0, 14.0, 17.0, 22.0, 36.0, 49.0, 49.0, 96.0, 144.0, 300.0, 580.0, 1418.0, 4992.0, 25498.0, 340391.0, 625982.0, 38886.0, 6677.0, 1846.0, 718.0, 322.0, 161.0, 95.0, 61.0, 44.0, 31.0, 29.0, 18.0, 18.0, 9.0, 4.0, 5.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.873291015625, -11.46533203125, -11.057373046875, -10.6494140625, -10.241455078125, -9.83349609375, -9.425537109375, -9.017578125, -8.609619140625, -8.20166015625, -7.793701171875, -7.3857421875, -6.977783203125, -6.56982421875, -6.161865234375, -5.75390625, -5.345947265625, -4.93798828125, -4.530029296875, -4.1220703125, -3.714111328125, -3.30615234375, -2.898193359375, -2.490234375, -2.082275390625, -1.67431640625, -1.266357421875, -0.8583984375, -0.450439453125, -0.04248046875, 0.365478515625, 0.7734375, 1.181396484375, 1.58935546875, 1.997314453125, 2.4052734375, 2.813232421875, 3.22119140625, 3.629150390625, 4.037109375, 4.445068359375, 4.85302734375, 5.260986328125, 5.6689453125, 6.076904296875, 6.48486328125, 6.892822265625, 7.30078125, 7.708740234375, 8.11669921875, 8.524658203125, 8.9326171875, 9.340576171875, 9.74853515625, 10.156494140625, 10.564453125, 10.972412109375, 11.38037109375, 11.788330078125, 12.1962890625, 12.604248046875, 13.01220703125, 13.420166015625, 13.828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 9.0, 12.0, 7.0, 12.0, 8.0, 14.0, 23.0, 34.0, 54.0, 69.0, 80.0, 119.0, 128.0, 128.0, 82.0, 73.0, 52.0, 28.0, 20.0, 11.0, 9.0, 9.0, 7.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009403228759765625, -0.0009144619107246399, -0.0008886009454727173, -0.0008627399802207947, -0.0008368790149688721, -0.0008110180497169495, -0.0007851570844650269, -0.0007592961192131042, -0.0007334351539611816, -0.000707574188709259, -0.0006817132234573364, -0.0006558522582054138, -0.0006299912929534912, -0.0006041303277015686, -0.000578269362449646, -0.0005524083971977234, -0.0005265474319458008, -0.0005006864666938782, -0.00047482550144195557, -0.00044896453619003296, -0.00042310357093811035, -0.00039724260568618774, -0.00037138164043426514, -0.00034552067518234253, -0.0003196597099304199, -0.0002937987446784973, -0.0002679377794265747, -0.0002420768141746521, -0.0002162158489227295, -0.00019035488367080688, -0.00016449391841888428, -0.00013863295316696167, -0.00011277198791503906, -8.691102266311646e-05, -6.105005741119385e-05, -3.518909215927124e-05, -9.328126907348633e-06, 1.6532838344573975e-05, 4.239380359649658e-05, 6.825476884841919e-05, 9.41157341003418e-05, 0.0001199766993522644, 0.000145837664604187, 0.00017169862985610962, 0.00019755959510803223, 0.00022342056035995483, 0.00024928152561187744, 0.00027514249086380005, 0.00030100345611572266, 0.00032686442136764526, 0.00035272538661956787, 0.0003785863518714905, 0.0004044473171234131, 0.0004303082823753357, 0.0004561692476272583, 0.0004820302128791809, 0.0005078911781311035, 0.0005337521433830261, 0.0005596131086349487, 0.0005854740738868713, 0.0006113350391387939, 0.0006371960043907166, 0.0006630569696426392, 0.0006889179348945618, 0.0007147789001464844]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 6.0, 3.0, 2.0, 3.0, 5.0, 3.0, 9.0, 7.0, 14.0, 13.0, 27.0, 31.0, 73.0, 114.0, 197.0, 430.0, 1198.0, 4836.0, 37116.0, 861608.0, 130065.0, 9464.0, 2044.0, 651.0, 265.0, 119.0, 78.0, 53.0, 35.0, 20.0, 19.0, 12.0, 12.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.78125, -12.3358154296875, -11.890380859375, -11.4449462890625, -10.99951171875, -10.5540771484375, -10.108642578125, -9.6632080078125, -9.2177734375, -8.7723388671875, -8.326904296875, -7.8814697265625, -7.43603515625, -6.9906005859375, -6.545166015625, -6.0997314453125, -5.654296875, -5.2088623046875, -4.763427734375, -4.3179931640625, -3.87255859375, -3.4271240234375, -2.981689453125, -2.5362548828125, -2.0908203125, -1.6453857421875, -1.199951171875, -0.7545166015625, -0.30908203125, 0.1363525390625, 0.581787109375, 1.0272216796875, 1.47265625, 1.9180908203125, 2.363525390625, 2.8089599609375, 3.25439453125, 3.6998291015625, 4.145263671875, 4.5906982421875, 5.0361328125, 5.4815673828125, 5.927001953125, 6.3724365234375, 6.81787109375, 7.2633056640625, 7.708740234375, 8.1541748046875, 8.599609375, 9.0450439453125, 9.490478515625, 9.9359130859375, 10.38134765625, 10.8267822265625, 11.272216796875, 11.7176513671875, 12.1630859375, 12.6085205078125, 13.053955078125, 13.4993896484375, 13.94482421875, 14.3902587890625, 14.835693359375, 15.2811279296875, 15.7265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 3.0, 3.0, 2.0, 5.0, 11.0, 7.0, 17.0, 19.0, 36.0, 27.0, 46.0, 71.0, 104.0, 102.0, 109.0, 73.0, 88.0, 84.0, 44.0, 31.0, 28.0, 24.0, 17.0, 9.0, 10.0, 7.0, 3.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.359375, -3.23785400390625, -3.1163330078125, -2.99481201171875, -2.873291015625, -2.75177001953125, -2.6302490234375, -2.50872802734375, -2.38720703125, -2.26568603515625, -2.1441650390625, -2.02264404296875, -1.901123046875, -1.77960205078125, -1.6580810546875, -1.53656005859375, -1.4150390625, -1.29351806640625, -1.1719970703125, -1.05047607421875, -0.928955078125, -0.80743408203125, -0.6859130859375, -0.56439208984375, -0.44287109375, -0.32135009765625, -0.1998291015625, -0.07830810546875, 0.043212890625, 0.16473388671875, 0.2862548828125, 0.40777587890625, 0.529296875, 0.65081787109375, 0.7723388671875, 0.89385986328125, 1.015380859375, 1.13690185546875, 1.2584228515625, 1.37994384765625, 1.50146484375, 1.62298583984375, 1.7445068359375, 1.86602783203125, 1.987548828125, 2.10906982421875, 2.2305908203125, 2.35211181640625, 2.4736328125, 2.59515380859375, 2.7166748046875, 2.83819580078125, 2.959716796875, 3.08123779296875, 3.2027587890625, 3.32427978515625, 3.44580078125, 3.56732177734375, 3.6888427734375, 3.81036376953125, 3.931884765625, 4.05340576171875, 4.1749267578125, 4.29644775390625, 4.41796875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 45.0, 444.0, 458.0, 39.0, 10.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.59475708007812, -103.68004608154297, -96.76532745361328, -89.85061645507812, -82.93589782714844, -76.02118682861328, -69.10647583007812, -62.1917610168457, -55.27704620361328, -48.36233139038086, -41.44761657714844, -34.53290557861328, -27.61819076538086, -20.703475952148438, -13.788764953613281, -6.874050140380859, 0.0406646728515625, 6.955378532409668, 13.870092391967773, 20.784805297851562, 27.699520111083984, 34.614234924316406, 41.52894592285156, 48.443660736083984, 55.358375549316406, 62.27309036254883, 69.18780517578125, 76.1025161743164, 83.01722717285156, 89.93194580078125, 96.8466567993164, 103.76136779785156, 110.67608642578125, 117.5907974243164, 124.5055160522461, 131.42022705078125, 138.33494567871094, 145.24966430664062, 152.16436767578125, 159.07908630371094, 165.99380493164062, 172.9085235595703, 179.82322692871094, 186.73794555664062, 193.6526641845703, 200.5673828125, 207.48208618164062, 214.3968048095703, 221.31150817871094, 228.22622680664062, 235.14093017578125, 242.05564880371094, 248.97036743164062, 255.88507080078125, 262.7998046875, 269.7145080566406, 276.62921142578125, 283.5439147949219, 290.4586486816406, 297.37335205078125, 304.2880554199219, 311.2027893066406, 318.11749267578125, 325.0321960449219, 331.9469299316406]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 15.0, 15.0, 10.0, 17.0, 22.0, 23.0, 31.0, 32.0, 39.0, 53.0, 50.0, 68.0, 50.0, 50.0, 55.0, 58.0, 54.0, 56.0, 61.0, 39.0, 32.0, 25.0, 28.0, 23.0, 14.0, 19.0, 13.0, 14.0, 9.0, 6.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.326953887939453, -21.646638870239258, -20.966323852539062, -20.286008834838867, -19.605693817138672, -18.92538070678711, -18.245065689086914, -17.56475067138672, -16.884435653686523, -16.204120635986328, -15.523805618286133, -14.843491554260254, -14.163176536560059, -13.482861518859863, -12.802547454833984, -12.122232437133789, -11.441917419433594, -10.761602401733398, -10.081287384033203, -9.400973320007324, -8.720658302307129, -8.040343284606934, -7.3600287437438965, -6.679714202880859, -5.999399185180664, -5.319084167480469, -4.638769626617432, -3.9584548473358154, -3.278140068054199, -2.597825288772583, -1.9175105094909668, -1.2371959686279297, -0.5568828582763672, 0.12343192100524902, 0.8037467002868652, 1.4840614795684814, 2.1643762588500977, 2.844691038131714, 3.52500581741333, 4.205320358276367, 4.8856353759765625, 5.565950393676758, 6.246264934539795, 6.926579475402832, 7.606894493103027, 8.287209510803223, 8.967523574829102, 9.647838592529297, 10.328153610229492, 11.008468627929688, 11.688783645629883, 12.369097709655762, 13.049412727355957, 13.729727745056152, 14.410041809082031, 15.090356826782227, 15.770671844482422, 16.450986862182617, 17.131301879882812, 17.811616897583008, 18.491931915283203, 19.172245025634766, 19.85256004333496, 20.532875061035156, 21.21319007873535]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 8.0, 10.0, 15.0, 33.0, 63.0, 267.0, 9184.0, 4182996.0, 1099.0, 245.0, 122.0, 87.0, 48.0, 38.0, 21.0, 24.0, 8.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.28125, -47.19287109375, -44.1044921875, -41.01611328125, -37.927734375, -34.83935546875, -31.7509765625, -28.66259765625, -25.57421875, -22.48583984375, -19.3974609375, -16.30908203125, -13.220703125, -10.13232421875, -7.0439453125, -3.95556640625, -0.8671875, 2.22119140625, 5.3095703125, 8.39794921875, 11.486328125, 14.57470703125, 17.6630859375, 20.75146484375, 23.83984375, 26.92822265625, 30.0166015625, 33.10498046875, 36.193359375, 39.28173828125, 42.3701171875, 45.45849609375, 48.546875, 51.63525390625, 54.7236328125, 57.81201171875, 60.900390625, 63.98876953125, 67.0771484375, 70.16552734375, 73.25390625, 76.34228515625, 79.4306640625, 82.51904296875, 85.607421875, 88.69580078125, 91.7841796875, 94.87255859375, 97.9609375, 101.04931640625, 104.1376953125, 107.22607421875, 110.314453125, 113.40283203125, 116.4912109375, 119.57958984375, 122.66796875, 125.75634765625, 128.8447265625, 131.93310546875, 135.021484375, 138.10986328125, 141.1982421875, 144.28662109375, 147.375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 38.0, 103.0, 237.0, 294.0, 202.0, 92.0, 31.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71142578125, -0.6434249877929688, -0.5754241943359375, -0.5074234008789062, -0.439422607421875, -0.37142181396484375, -0.3034210205078125, -0.23542022705078125, -0.16741943359375, -0.09941864013671875, -0.0314178466796875, 0.03658294677734375, 0.104583740234375, 0.17258453369140625, 0.2405853271484375, 0.30858612060546875, 0.3765869140625, 0.44458770751953125, 0.5125885009765625, 0.5805892944335938, 0.648590087890625, 0.7165908813476562, 0.7845916748046875, 0.8525924682617188, 0.92059326171875, 0.9885940551757812, 1.0565948486328125, 1.1245956420898438, 1.192596435546875, 1.2605972290039062, 1.3285980224609375, 1.3965988159179688, 1.464599609375, 1.5326004028320312, 1.6006011962890625, 1.6686019897460938, 1.736602783203125, 1.8046035766601562, 1.8726043701171875, 1.9406051635742188, 2.00860595703125, 2.0766067504882812, 2.1446075439453125, 2.2126083374023438, 2.280609130859375, 2.3486099243164062, 2.4166107177734375, 2.4846115112304688, 2.5526123046875, 2.6206130981445312, 2.6886138916015625, 2.7566146850585938, 2.824615478515625, 2.8926162719726562, 2.9606170654296875, 3.0286178588867188, 3.09661865234375, 3.1646194458007812, 3.2326202392578125, 3.3006210327148438, 3.368621826171875, 3.4366226196289062, 3.5046234130859375, 3.5726242065429688, 3.640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 17.0, 26.0, 48.0, 79.0, 114.0, 125.0, 200.0, 312.0, 5362.0, 4185779.0, 1456.0, 279.0, 181.0, 112.0, 65.0, 48.0, 28.0, 20.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-162.25, -157.53125, -152.8125, -148.09375, -143.375, -138.65625, -133.9375, -129.21875, -124.5, -119.78125, -115.0625, -110.34375, -105.625, -100.90625, -96.1875, -91.46875, -86.75, -82.03125, -77.3125, -72.59375, -67.875, -63.15625, -58.4375, -53.71875, -49.0, -44.28125, -39.5625, -34.84375, -30.125, -25.40625, -20.6875, -15.96875, -11.25, -6.53125, -1.8125, 2.90625, 7.625, 12.34375, 17.0625, 21.78125, 26.5, 31.21875, 35.9375, 40.65625, 45.375, 50.09375, 54.8125, 59.53125, 64.25, 68.96875, 73.6875, 78.40625, 83.125, 87.84375, 92.5625, 97.28125, 102.0, 106.71875, 111.4375, 116.15625, 120.875, 125.59375, 130.3125, 135.03125, 139.75]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 13.0, 12.0, 47.0, 115.0, 706.0, 2973.0, 158.0, 39.0, 14.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0234375, -13.75982666015625, -13.4962158203125, -13.23260498046875, -12.968994140625, -12.70538330078125, -12.4417724609375, -12.17816162109375, -11.91455078125, -11.65093994140625, -11.3873291015625, -11.12371826171875, -10.860107421875, -10.59649658203125, -10.3328857421875, -10.06927490234375, -9.8056640625, -9.54205322265625, -9.2784423828125, -9.01483154296875, -8.751220703125, -8.48760986328125, -8.2239990234375, -7.96038818359375, -7.69677734375, -7.43316650390625, -7.1695556640625, -6.90594482421875, -6.642333984375, -6.37872314453125, -6.1151123046875, -5.85150146484375, -5.587890625, -5.32427978515625, -5.0606689453125, -4.79705810546875, -4.533447265625, -4.26983642578125, -4.0062255859375, -3.74261474609375, -3.47900390625, -3.21539306640625, -2.9517822265625, -2.68817138671875, -2.424560546875, -2.16094970703125, -1.8973388671875, -1.63372802734375, -1.3701171875, -1.10650634765625, -0.8428955078125, -0.57928466796875, -0.315673828125, -0.05206298828125, 0.2115478515625, 0.47515869140625, 0.73876953125, 1.00238037109375, 1.2659912109375, 1.52960205078125, 1.793212890625, 2.05682373046875, 2.3204345703125, 2.58404541015625, 2.84765625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 28.0, 109.0, 685.0, 151.0, 19.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.99972534179688, -184.50506591796875, -179.01040649414062, -173.51573181152344, -168.0210723876953, -162.5264129638672, -157.03175354003906, -151.53707885742188, -146.04241943359375, -140.54776000976562, -135.0531005859375, -129.5584259033203, -124.06376647949219, -118.56910705566406, -113.07444763183594, -107.57978057861328, -102.08512115478516, -96.59046173095703, -91.09579467773438, -85.60113525390625, -80.1064682006836, -74.61180877685547, -69.11714172363281, -63.62248229980469, -58.1278190612793, -52.633155822753906, -47.138492584228516, -41.643829345703125, -36.149169921875, -30.654504776000977, -25.15984344482422, -19.665180206298828, -14.170516967773438, -8.675853729248047, -3.1811914443969727, 2.3134708404541016, 7.808134078979492, 13.302797317504883, 18.79745864868164, 24.29212188720703, 29.786785125732422, 35.28144836425781, 40.7761116027832, 46.270774841308594, 51.76543426513672, 57.260101318359375, 62.7547607421875, 68.24942016601562, 73.74408721923828, 79.2387466430664, 84.73341369628906, 90.22807312011719, 95.72274017333984, 101.21739959716797, 106.71206665039062, 112.20672607421875, 117.70138549804688, 123.196044921875, 128.69070434570312, 134.1853790283203, 139.68003845214844, 145.17469787597656, 150.6693572998047, 156.16403198242188, 161.65869140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 10.0, 11.0, 23.0, 30.0, 50.0, 68.0, 76.0, 105.0, 104.0, 111.0, 96.0, 78.0, 68.0, 74.0, 49.0, 26.0, 12.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.698463439941406, -22.957927703857422, -22.217391967773438, -21.47685432434082, -20.736318588256836, -19.99578285217285, -19.255245208740234, -18.51470947265625, -17.774173736572266, -17.03363800048828, -16.293102264404297, -15.55256462097168, -14.812028884887695, -14.071493148803711, -13.33095645904541, -12.59041976928711, -11.849884033203125, -11.10934829711914, -10.36881160736084, -9.628274917602539, -8.887739181518555, -8.14720344543457, -7.4066667556762695, -6.666130542755127, -5.925594329833984, -5.185058116912842, -4.444521903991699, -3.7039856910705566, -2.963449478149414, -2.2229132652282715, -1.482377052307129, -0.7418408393859863, -0.00130462646484375, 0.7392315864562988, 1.4797677993774414, 2.220304012298584, 2.9608402252197266, 3.701376438140869, 4.441912651062012, 5.182448863983154, 5.922985076904297, 6.6635212898254395, 7.404057502746582, 8.144594192504883, 8.885129928588867, 9.625665664672852, 10.366202354431152, 11.106739044189453, 11.847274780273438, 12.587810516357422, 13.328347206115723, 14.068883895874023, 14.809419631958008, 15.549955368041992, 16.29049301147461, 17.031028747558594, 17.771564483642578, 18.512100219726562, 19.252635955810547, 19.993173599243164, 20.73370933532715, 21.474245071411133, 22.21478271484375, 22.955318450927734, 23.69585418701172]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 17.0, 18.0, 16.0, 34.0, 49.0, 82.0, 163.0, 436.0, 1938.0, 27816.0, 967923.0, 46646.0, 2473.0, 514.0, 161.0, 75.0, 43.0, 38.0, 27.0, 30.0, 14.0, 13.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.5, -62.51904296875, -60.5380859375, -58.55712890625, -56.576171875, -54.59521484375, -52.6142578125, -50.63330078125, -48.65234375, -46.67138671875, -44.6904296875, -42.70947265625, -40.728515625, -38.74755859375, -36.7666015625, -34.78564453125, -32.8046875, -30.82373046875, -28.8427734375, -26.86181640625, -24.880859375, -22.89990234375, -20.9189453125, -18.93798828125, -16.95703125, -14.97607421875, -12.9951171875, -11.01416015625, -9.033203125, -7.05224609375, -5.0712890625, -3.09033203125, -1.109375, 0.87158203125, 2.8525390625, 4.83349609375, 6.814453125, 8.79541015625, 10.7763671875, 12.75732421875, 14.73828125, 16.71923828125, 18.7001953125, 20.68115234375, 22.662109375, 24.64306640625, 26.6240234375, 28.60498046875, 30.5859375, 32.56689453125, 34.5478515625, 36.52880859375, 38.509765625, 40.49072265625, 42.4716796875, 44.45263671875, 46.43359375, 48.41455078125, 50.3955078125, 52.37646484375, 54.357421875, 56.33837890625, 58.3193359375, 60.30029296875, 62.28125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 10.0, 7.0, 26.0, 47.0, 54.0, 92.0, 137.0, 144.0, 127.0, 137.0, 73.0, 62.0, 41.0, 26.0, 7.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0087890625, -0.9490203857421875, -0.889251708984375, -0.8294830322265625, -0.76971435546875, -0.7099456787109375, -0.650177001953125, -0.5904083251953125, -0.5306396484375, -0.4708709716796875, -0.411102294921875, -0.3513336181640625, -0.29156494140625, -0.2317962646484375, -0.172027587890625, -0.1122589111328125, -0.052490234375, 0.0072784423828125, 0.067047119140625, 0.1268157958984375, 0.18658447265625, 0.2463531494140625, 0.306121826171875, 0.3658905029296875, 0.4256591796875, 0.4854278564453125, 0.545196533203125, 0.6049652099609375, 0.66473388671875, 0.7245025634765625, 0.784271240234375, 0.8440399169921875, 0.90380859375, 0.9635772705078125, 1.023345947265625, 1.0831146240234375, 1.14288330078125, 1.2026519775390625, 1.262420654296875, 1.3221893310546875, 1.3819580078125, 1.4417266845703125, 1.501495361328125, 1.5612640380859375, 1.62103271484375, 1.6808013916015625, 1.740570068359375, 1.8003387451171875, 1.860107421875, 1.9198760986328125, 1.979644775390625, 2.0394134521484375, 2.09918212890625, 2.1589508056640625, 2.218719482421875, 2.2784881591796875, 2.3382568359375, 2.3980255126953125, 2.457794189453125, 2.5175628662109375, 2.57733154296875, 2.6371002197265625, 2.696868896484375, 2.7566375732421875, 2.81640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 5.0, 10.0, 18.0, 21.0, 22.0, 35.0, 39.0, 58.0, 101.0, 132.0, 192.0, 279.0, 512.0, 835.0, 1693.0, 3940.0, 11453.0, 45900.0, 292888.0, 556014.0, 102275.0, 20578.0, 6177.0, 2466.0, 1148.0, 590.0, 364.0, 253.0, 171.0, 98.0, 75.0, 50.0, 36.0, 36.0, 24.0, 16.0, 16.0, 9.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.875, -16.43359375, -15.9921875, -15.55078125, -15.109375, -14.66796875, -14.2265625, -13.78515625, -13.34375, -12.90234375, -12.4609375, -12.01953125, -11.578125, -11.13671875, -10.6953125, -10.25390625, -9.8125, -9.37109375, -8.9296875, -8.48828125, -8.046875, -7.60546875, -7.1640625, -6.72265625, -6.28125, -5.83984375, -5.3984375, -4.95703125, -4.515625, -4.07421875, -3.6328125, -3.19140625, -2.75, -2.30859375, -1.8671875, -1.42578125, -0.984375, -0.54296875, -0.1015625, 0.33984375, 0.78125, 1.22265625, 1.6640625, 2.10546875, 2.546875, 2.98828125, 3.4296875, 3.87109375, 4.3125, 4.75390625, 5.1953125, 5.63671875, 6.078125, 6.51953125, 6.9609375, 7.40234375, 7.84375, 8.28515625, 8.7265625, 9.16796875, 9.609375, 10.05078125, 10.4921875, 10.93359375, 11.375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 5.0, 13.0, 10.0, 14.0, 24.0, 26.0, 30.0, 36.0, 51.0, 47.0, 46.0, 41.0, 53.0, 47.0, 49.0, 53.0, 45.0, 48.0, 47.0, 38.0, 43.0, 43.0, 22.0, 26.0, 22.0, 24.0, 12.0, 17.0, 9.0, 9.0, 10.0, 5.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.370361328125, -4.24072265625, -4.111083984375, -3.9814453125, -3.851806640625, -3.72216796875, -3.592529296875, -3.462890625, -3.333251953125, -3.20361328125, -3.073974609375, -2.9443359375, -2.814697265625, -2.68505859375, -2.555419921875, -2.42578125, -2.296142578125, -2.16650390625, -2.036865234375, -1.9072265625, -1.777587890625, -1.64794921875, -1.518310546875, -1.388671875, -1.259033203125, -1.12939453125, -0.999755859375, -0.8701171875, -0.740478515625, -0.61083984375, -0.481201171875, -0.3515625, -0.221923828125, -0.09228515625, 0.037353515625, 0.1669921875, 0.296630859375, 0.42626953125, 0.555908203125, 0.685546875, 0.815185546875, 0.94482421875, 1.074462890625, 1.2041015625, 1.333740234375, 1.46337890625, 1.593017578125, 1.72265625, 1.852294921875, 1.98193359375, 2.111572265625, 2.2412109375, 2.370849609375, 2.50048828125, 2.630126953125, 2.759765625, 2.889404296875, 3.01904296875, 3.148681640625, 3.2783203125, 3.407958984375, 3.53759765625, 3.667236328125, 3.796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 11.0, 4.0, 9.0, 15.0, 19.0, 42.0, 93.0, 186.0, 491.0, 1806.0, 17558.0, 992660.0, 32109.0, 2519.0, 555.0, 234.0, 95.0, 47.0, 31.0, 23.0, 14.0, 12.0, 4.0, 4.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.75, -47.25390625, -45.7578125, -44.26171875, -42.765625, -41.26953125, -39.7734375, -38.27734375, -36.78125, -35.28515625, -33.7890625, -32.29296875, -30.796875, -29.30078125, -27.8046875, -26.30859375, -24.8125, -23.31640625, -21.8203125, -20.32421875, -18.828125, -17.33203125, -15.8359375, -14.33984375, -12.84375, -11.34765625, -9.8515625, -8.35546875, -6.859375, -5.36328125, -3.8671875, -2.37109375, -0.875, 0.62109375, 2.1171875, 3.61328125, 5.109375, 6.60546875, 8.1015625, 9.59765625, 11.09375, 12.58984375, 14.0859375, 15.58203125, 17.078125, 18.57421875, 20.0703125, 21.56640625, 23.0625, 24.55859375, 26.0546875, 27.55078125, 29.046875, 30.54296875, 32.0390625, 33.53515625, 35.03125, 36.52734375, 38.0234375, 39.51953125, 41.015625, 42.51171875, 44.0078125, 45.50390625, 47.0]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 7.0, 13.0, 24.0, 43.0, 110.0, 226.0, 258.0, 181.0, 78.0, 28.0, 17.0, 8.0, 9.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002361297607421875, -0.0022718310356140137, -0.0021823644638061523, -0.002092897891998291, -0.0020034313201904297, -0.0019139647483825684, -0.001824498176574707, -0.0017350316047668457, -0.0016455650329589844, -0.001556098461151123, -0.0014666318893432617, -0.0013771653175354004, -0.001287698745727539, -0.0011982321739196777, -0.0011087656021118164, -0.001019299030303955, -0.0009298324584960938, -0.0008403658866882324, -0.0007508993148803711, -0.0006614327430725098, -0.0005719661712646484, -0.0004824995994567871, -0.0003930330276489258, -0.00030356645584106445, -0.00021409988403320312, -0.0001246333122253418, -3.516674041748047e-05, 5.429983139038086e-05, 0.0001437664031982422, 0.00023323297500610352, 0.00032269954681396484, 0.00041216611862182617, 0.0005016326904296875, 0.0005910992622375488, 0.0006805658340454102, 0.0007700324058532715, 0.0008594989776611328, 0.0009489655494689941, 0.0010384321212768555, 0.0011278986930847168, 0.0012173652648925781, 0.0013068318367004395, 0.0013962984085083008, 0.0014857649803161621, 0.0015752315521240234, 0.0016646981239318848, 0.001754164695739746, 0.0018436312675476074, 0.0019330978393554688, 0.00202256441116333, 0.0021120309829711914, 0.0022014975547790527, 0.002290964126586914, 0.0023804306983947754, 0.0024698972702026367, 0.002559363842010498, 0.0026488304138183594, 0.0027382969856262207, 0.002827763557434082, 0.0029172301292419434, 0.0030066967010498047, 0.003096163272857666, 0.0031856298446655273, 0.0032750964164733887, 0.00336456298828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 2.0, 4.0, 4.0, 3.0, 13.0, 14.0, 21.0, 44.0, 48.0, 98.0, 239.0, 629.0, 2643.0, 31339.0, 990343.0, 19964.0, 2140.0, 567.0, 226.0, 89.0, 43.0, 29.0, 14.0, 7.0, 5.0, 3.0, 3.0, 4.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.8125, -40.6650390625, -39.517578125, -38.3701171875, -37.22265625, -36.0751953125, -34.927734375, -33.7802734375, -32.6328125, -31.4853515625, -30.337890625, -29.1904296875, -28.04296875, -26.8955078125, -25.748046875, -24.6005859375, -23.453125, -22.3056640625, -21.158203125, -20.0107421875, -18.86328125, -17.7158203125, -16.568359375, -15.4208984375, -14.2734375, -13.1259765625, -11.978515625, -10.8310546875, -9.68359375, -8.5361328125, -7.388671875, -6.2412109375, -5.09375, -3.9462890625, -2.798828125, -1.6513671875, -0.50390625, 0.6435546875, 1.791015625, 2.9384765625, 4.0859375, 5.2333984375, 6.380859375, 7.5283203125, 8.67578125, 9.8232421875, 10.970703125, 12.1181640625, 13.265625, 14.4130859375, 15.560546875, 16.7080078125, 17.85546875, 19.0029296875, 20.150390625, 21.2978515625, 22.4453125, 23.5927734375, 24.740234375, 25.8876953125, 27.03515625, 28.1826171875, 29.330078125, 30.4775390625, 31.625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 3.0, 11.0, 5.0, 11.0, 21.0, 23.0, 41.0, 63.0, 138.0, 200.0, 189.0, 122.0, 66.0, 32.0, 25.0, 11.0, 6.0, 12.0, 3.0, 3.0, 1.0, 0.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.357421875, -10.04296875, -9.728515625, -9.4140625, -9.099609375, -8.78515625, -8.470703125, -8.15625, -7.841796875, -7.52734375, -7.212890625, -6.8984375, -6.583984375, -6.26953125, -5.955078125, -5.640625, -5.326171875, -5.01171875, -4.697265625, -4.3828125, -4.068359375, -3.75390625, -3.439453125, -3.125, -2.810546875, -2.49609375, -2.181640625, -1.8671875, -1.552734375, -1.23828125, -0.923828125, -0.609375, -0.294921875, 0.01953125, 0.333984375, 0.6484375, 0.962890625, 1.27734375, 1.591796875, 1.90625, 2.220703125, 2.53515625, 2.849609375, 3.1640625, 3.478515625, 3.79296875, 4.107421875, 4.421875, 4.736328125, 5.05078125, 5.365234375, 5.6796875, 5.994140625, 6.30859375, 6.623046875, 6.9375, 7.251953125, 7.56640625, 7.880859375, 8.1953125, 8.509765625, 8.82421875, 9.138671875, 9.453125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 15.0, 20.0, 60.0, 99.0, 214.0, 262.0, 178.0, 83.0, 28.0, 22.0, 8.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.11685943603516, -107.44845581054688, -103.78005981445312, -100.11165618896484, -96.44325256347656, -92.77485656738281, -89.10645294189453, -85.43804931640625, -81.7696533203125, -78.10124969482422, -74.43285369873047, -70.76445007324219, -67.09605407714844, -63.427650451660156, -59.759246826171875, -56.09084701538086, -52.422447204589844, -48.75404739379883, -45.08564758300781, -41.41724395751953, -37.748844146728516, -34.0804443359375, -30.41204261779785, -26.743640899658203, -23.075241088867188, -19.406841278076172, -15.738439559936523, -12.070038795471191, -8.40163803100586, -4.733238220214844, -1.0648365020751953, 2.603565216064453, 6.27197265625, 9.940373420715332, 13.608774185180664, 17.277175903320312, 20.945575714111328, 24.613975524902344, 28.282377243041992, 31.95077896118164, 35.619178771972656, 39.28757858276367, 42.95597839355469, 46.62438201904297, 50.292781829833984, 53.961181640625, 57.62958526611328, 61.2979850769043, 64.96638488769531, 68.6347885131836, 72.30318450927734, 75.97158813476562, 79.63998413085938, 83.30838775634766, 86.97679138183594, 90.64518737792969, 94.31359100341797, 97.98199462890625, 101.650390625, 105.31879425048828, 108.98719787597656, 112.65559387207031, 116.3239974975586, 119.99240112304688, 123.66079711914062]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 3.0, 4.0, 12.0, 7.0, 17.0, 20.0, 21.0, 18.0, 30.0, 40.0, 34.0, 35.0, 44.0, 39.0, 46.0, 49.0, 53.0, 52.0, 53.0, 40.0, 55.0, 56.0, 46.0, 44.0, 34.0, 26.0, 32.0, 16.0, 18.0, 19.0, 11.0, 8.0, 8.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.139827728271484, -27.078466415405273, -26.01710319519043, -24.95574188232422, -23.894378662109375, -22.833017349243164, -21.771656036376953, -20.71029281616211, -19.6489315032959, -18.587570190429688, -17.526206970214844, -16.464845657348633, -15.403483390808105, -14.342121124267578, -13.280759811401367, -12.21939754486084, -11.158035278320312, -10.096673011779785, -9.035310745239258, -7.973949432373047, -6.9125871658325195, -5.851224899291992, -4.789863109588623, -3.728501319885254, -2.6671390533447266, -1.6057770252227783, -0.5444149971008301, 0.5169470310211182, 1.5783090591430664, 2.6396713256835938, 3.701033115386963, 4.762394905090332, 5.823753356933594, 6.885115623474121, 7.94647741317749, 9.00783920288086, 10.069201469421387, 11.130563735961914, 12.191925048828125, 13.253287315368652, 14.31464958190918, 15.376011848449707, 16.437374114990234, 17.498735427856445, 18.560096740722656, 19.6214599609375, 20.68282127380371, 21.744182586669922, 22.805545806884766, 23.866907119750977, 24.92827033996582, 25.98963165283203, 27.050994873046875, 28.112356185913086, 29.173717498779297, 30.23508071899414, 31.29644203186035, 32.35780334472656, 33.419166564941406, 34.48052978515625, 35.54188919067383, 36.60325241088867, 37.664615631103516, 38.725975036621094, 39.78733825683594]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 8.0, 1.0, 9.0, 15.0, 12.0, 26.0, 36.0, 55.0, 69.0, 189.0, 513.0, 1532.0, 8752.0, 244267.0, 3905938.0, 28454.0, 2869.0, 725.0, 297.0, 160.0, 84.0, 65.0, 57.0, 38.0, 21.0, 21.0, 13.0, 12.0, 8.0, 6.0, 7.0, 4.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.6875, -36.51806640625, -35.3486328125, -34.17919921875, -33.009765625, -31.84033203125, -30.6708984375, -29.50146484375, -28.33203125, -27.16259765625, -25.9931640625, -24.82373046875, -23.654296875, -22.48486328125, -21.3154296875, -20.14599609375, -18.9765625, -17.80712890625, -16.6376953125, -15.46826171875, -14.298828125, -13.12939453125, -11.9599609375, -10.79052734375, -9.62109375, -8.45166015625, -7.2822265625, -6.11279296875, -4.943359375, -3.77392578125, -2.6044921875, -1.43505859375, -0.265625, 0.90380859375, 2.0732421875, 3.24267578125, 4.412109375, 5.58154296875, 6.7509765625, 7.92041015625, 9.08984375, 10.25927734375, 11.4287109375, 12.59814453125, 13.767578125, 14.93701171875, 16.1064453125, 17.27587890625, 18.4453125, 19.61474609375, 20.7841796875, 21.95361328125, 23.123046875, 24.29248046875, 25.4619140625, 26.63134765625, 27.80078125, 28.97021484375, 30.1396484375, 31.30908203125, 32.478515625, 33.64794921875, 34.8173828125, 35.98681640625, 37.15625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 10.0, 16.0, 18.0, 33.0, 47.0, 70.0, 87.0, 105.0, 101.0, 107.0, 109.0, 90.0, 65.0, 40.0, 37.0, 22.0, 18.0, 10.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9501953125, -0.8942718505859375, -0.838348388671875, -0.7824249267578125, -0.72650146484375, -0.6705780029296875, -0.614654541015625, -0.5587310791015625, -0.5028076171875, -0.4468841552734375, -0.390960693359375, -0.3350372314453125, -0.27911376953125, -0.2231903076171875, -0.167266845703125, -0.1113433837890625, -0.055419921875, 0.0005035400390625, 0.056427001953125, 0.1123504638671875, 0.16827392578125, 0.2241973876953125, 0.280120849609375, 0.3360443115234375, 0.3919677734375, 0.4478912353515625, 0.503814697265625, 0.5597381591796875, 0.61566162109375, 0.6715850830078125, 0.727508544921875, 0.7834320068359375, 0.83935546875, 0.8952789306640625, 0.951202392578125, 1.0071258544921875, 1.06304931640625, 1.1189727783203125, 1.174896240234375, 1.2308197021484375, 1.2867431640625, 1.3426666259765625, 1.398590087890625, 1.4545135498046875, 1.51043701171875, 1.5663604736328125, 1.622283935546875, 1.6782073974609375, 1.734130859375, 1.7900543212890625, 1.845977783203125, 1.9019012451171875, 1.95782470703125, 2.0137481689453125, 2.069671630859375, 2.1255950927734375, 2.1815185546875, 2.2374420166015625, 2.293365478515625, 2.3492889404296875, 2.40521240234375, 2.4611358642578125, 2.517059326171875, 2.5729827880859375, 2.62890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 7.0, 6.0, 9.0, 15.0, 16.0, 20.0, 30.0, 41.0, 56.0, 74.0, 147.0, 201.0, 400.0, 993.0, 5920.0, 4005661.0, 176346.0, 2805.0, 684.0, 309.0, 148.0, 100.0, 74.0, 50.0, 31.0, 33.0, 25.0, 19.0, 12.0, 8.0, 12.0, 1.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-66.875, -64.634765625, -62.39453125, -60.154296875, -57.9140625, -55.673828125, -53.43359375, -51.193359375, -48.953125, -46.712890625, -44.47265625, -42.232421875, -39.9921875, -37.751953125, -35.51171875, -33.271484375, -31.03125, -28.791015625, -26.55078125, -24.310546875, -22.0703125, -19.830078125, -17.58984375, -15.349609375, -13.109375, -10.869140625, -8.62890625, -6.388671875, -4.1484375, -1.908203125, 0.33203125, 2.572265625, 4.8125, 7.052734375, 9.29296875, 11.533203125, 13.7734375, 16.013671875, 18.25390625, 20.494140625, 22.734375, 24.974609375, 27.21484375, 29.455078125, 31.6953125, 33.935546875, 36.17578125, 38.416015625, 40.65625, 42.896484375, 45.13671875, 47.376953125, 49.6171875, 51.857421875, 54.09765625, 56.337890625, 58.578125, 60.818359375, 63.05859375, 65.298828125, 67.5390625, 69.779296875, 72.01953125, 74.259765625, 76.5]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 7.0, 12.0, 21.0, 29.0, 58.0, 121.0, 246.0, 736.0, 2086.0, 440.0, 131.0, 66.0, 57.0, 23.0, 12.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5546875, -5.39727783203125, -5.2398681640625, -5.08245849609375, -4.925048828125, -4.76763916015625, -4.6102294921875, -4.45281982421875, -4.29541015625, -4.13800048828125, -3.9805908203125, -3.82318115234375, -3.665771484375, -3.50836181640625, -3.3509521484375, -3.19354248046875, -3.0361328125, -2.87872314453125, -2.7213134765625, -2.56390380859375, -2.406494140625, -2.24908447265625, -2.0916748046875, -1.93426513671875, -1.77685546875, -1.61944580078125, -1.4620361328125, -1.30462646484375, -1.147216796875, -0.98980712890625, -0.8323974609375, -0.67498779296875, -0.517578125, -0.36016845703125, -0.2027587890625, -0.04534912109375, 0.112060546875, 0.26947021484375, 0.4268798828125, 0.58428955078125, 0.74169921875, 0.89910888671875, 1.0565185546875, 1.21392822265625, 1.371337890625, 1.52874755859375, 1.6861572265625, 1.84356689453125, 2.0009765625, 2.15838623046875, 2.3157958984375, 2.47320556640625, 2.630615234375, 2.78802490234375, 2.9454345703125, 3.10284423828125, 3.26025390625, 3.41766357421875, 3.5750732421875, 3.73248291015625, 3.889892578125, 4.04730224609375, 4.2047119140625, 4.36212158203125, 4.51953125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 31.0, 155.0, 610.0, 165.0, 19.0, 13.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.44828796386719, -81.78407287597656, -77.1198501586914, -72.45562744140625, -67.79141235351562, -63.127193450927734, -58.462974548339844, -53.79875564575195, -49.13453674316406, -44.47031784057617, -39.80609893798828, -35.14188003540039, -30.4776611328125, -25.81344223022461, -21.14922332763672, -16.485004425048828, -11.820785522460938, -7.156566619873047, -2.4923477172851562, 2.1718711853027344, 6.836090087890625, 11.500308990478516, 16.164527893066406, 20.828746795654297, 25.492965698242188, 30.157184600830078, 34.82140350341797, 39.48562240600586, 44.14984130859375, 48.81406021118164, 53.47827911376953, 58.14249801635742, 62.80670166015625, 67.47091674804688, 72.13513946533203, 76.79936218261719, 81.46357727050781, 86.12779235839844, 90.7920150756836, 95.45623779296875, 100.12045288085938, 104.78466796875, 109.44889068603516, 114.11311340332031, 118.77732849121094, 123.44154357910156, 128.10577392578125, 132.76998901367188, 137.4342041015625, 142.09841918945312, 146.76263427734375, 151.42686462402344, 156.09107971191406, 160.7552947998047, 165.41952514648438, 170.083740234375, 174.74795532226562, 179.41217041015625, 184.07638549804688, 188.74061584472656, 193.4048309326172, 198.0690460205078, 202.7332763671875, 207.39749145507812, 212.06170654296875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 6.0, 9.0, 7.0, 9.0, 13.0, 26.0, 17.0, 26.0, 34.0, 31.0, 24.0, 33.0, 29.0, 53.0, 69.0, 51.0, 44.0, 46.0, 55.0, 50.0, 54.0, 33.0, 48.0, 41.0, 38.0, 28.0, 25.0, 14.0, 20.0, 10.0, 18.0, 13.0, 8.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.148128509521484, -11.78049373626709, -11.412859916687012, -11.045225143432617, -10.677590370178223, -10.309955596923828, -9.94232177734375, -9.574687004089355, -9.207052230834961, -8.839417457580566, -8.471783638000488, -8.104148864746094, -7.736514091491699, -7.368879795074463, -7.001245498657227, -6.633610725402832, -6.265976905822754, -5.898342609405518, -5.530707836151123, -5.163073539733887, -4.795438766479492, -4.427804470062256, -4.0601701736450195, -3.692535638809204, -3.3249011039733887, -2.9572665691375732, -2.589632034301758, -2.2219977378845215, -1.854363203048706, -1.4867286682128906, -1.1190943717956543, -0.7514598369598389, -0.38382434844970703, -0.016189873218536377, 0.3514446020126343, 0.7190790176391602, 1.0867135524749756, 1.454348087310791, 1.8219823837280273, 2.1896169185638428, 2.557251453399658, 2.9248859882354736, 3.292520523071289, 3.6601548194885254, 4.027789115905762, 4.395423889160156, 4.763058185577393, 5.130692481994629, 5.498327255249023, 5.86596155166626, 6.233596324920654, 6.601230621337891, 6.968865394592285, 7.3364996910095215, 7.704133987426758, 8.071768760681152, 8.439403533935547, 8.807038307189941, 9.17467212677002, 9.542306900024414, 9.909941673278809, 10.277576446533203, 10.645210266113281, 11.012845039367676, 11.380478858947754]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 6.0, 10.0, 10.0, 11.0, 13.0, 23.0, 27.0, 42.0, 47.0, 70.0, 124.0, 217.0, 419.0, 932.0, 3118.0, 21005.0, 326661.0, 646269.0, 42022.0, 5017.0, 1247.0, 513.0, 238.0, 146.0, 110.0, 74.0, 50.0, 34.0, 28.0, 12.0, 13.0, 8.0, 9.0, 12.0, 11.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-41.75, -40.6259765625, -39.501953125, -38.3779296875, -37.25390625, -36.1298828125, -35.005859375, -33.8818359375, -32.7578125, -31.6337890625, -30.509765625, -29.3857421875, -28.26171875, -27.1376953125, -26.013671875, -24.8896484375, -23.765625, -22.6416015625, -21.517578125, -20.3935546875, -19.26953125, -18.1455078125, -17.021484375, -15.8974609375, -14.7734375, -13.6494140625, -12.525390625, -11.4013671875, -10.27734375, -9.1533203125, -8.029296875, -6.9052734375, -5.78125, -4.6572265625, -3.533203125, -2.4091796875, -1.28515625, -0.1611328125, 0.962890625, 2.0869140625, 3.2109375, 4.3349609375, 5.458984375, 6.5830078125, 7.70703125, 8.8310546875, 9.955078125, 11.0791015625, 12.203125, 13.3271484375, 14.451171875, 15.5751953125, 16.69921875, 17.8232421875, 18.947265625, 20.0712890625, 21.1953125, 22.3193359375, 23.443359375, 24.5673828125, 25.69140625, 26.8154296875, 27.939453125, 29.0634765625, 30.1875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 3.0, 19.0, 19.0, 14.0, 33.0, 78.0, 69.0, 92.0, 114.0, 104.0, 95.0, 95.0, 90.0, 53.0, 44.0, 34.0, 21.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.0429229736328125, -0.979400634765625, -0.9158782958984375, -0.85235595703125, -0.7888336181640625, -0.725311279296875, -0.6617889404296875, -0.5982666015625, -0.5347442626953125, -0.471221923828125, -0.4076995849609375, -0.34417724609375, -0.2806549072265625, -0.217132568359375, -0.1536102294921875, -0.090087890625, -0.0265655517578125, 0.036956787109375, 0.1004791259765625, 0.16400146484375, 0.2275238037109375, 0.291046142578125, 0.3545684814453125, 0.4180908203125, 0.4816131591796875, 0.545135498046875, 0.6086578369140625, 0.67218017578125, 0.7357025146484375, 0.799224853515625, 0.8627471923828125, 0.92626953125, 0.9897918701171875, 1.053314208984375, 1.1168365478515625, 1.18035888671875, 1.2438812255859375, 1.307403564453125, 1.3709259033203125, 1.4344482421875, 1.4979705810546875, 1.561492919921875, 1.6250152587890625, 1.68853759765625, 1.7520599365234375, 1.815582275390625, 1.8791046142578125, 1.942626953125, 2.0061492919921875, 2.069671630859375, 2.1331939697265625, 2.19671630859375, 2.2602386474609375, 2.323760986328125, 2.3872833251953125, 2.4508056640625, 2.5143280029296875, 2.577850341796875, 2.6413726806640625, 2.70489501953125, 2.7684173583984375, 2.831939697265625, 2.8954620361328125, 2.958984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 15.0, 11.0, 17.0, 28.0, 55.0, 47.0, 79.0, 122.0, 155.0, 305.0, 400.0, 666.0, 1232.0, 2410.0, 5079.0, 12873.0, 43508.0, 199974.0, 521119.0, 194584.0, 42894.0, 12539.0, 4920.0, 2373.0, 1274.0, 705.0, 407.0, 256.0, 180.0, 92.0, 60.0, 45.0, 42.0, 25.0, 19.0, 9.0, 12.0, 7.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.9327392578125, -11.513916015625, -11.0950927734375, -10.67626953125, -10.2574462890625, -9.838623046875, -9.4197998046875, -9.0009765625, -8.5821533203125, -8.163330078125, -7.7445068359375, -7.32568359375, -6.9068603515625, -6.488037109375, -6.0692138671875, -5.650390625, -5.2315673828125, -4.812744140625, -4.3939208984375, -3.97509765625, -3.5562744140625, -3.137451171875, -2.7186279296875, -2.2998046875, -1.8809814453125, -1.462158203125, -1.0433349609375, -0.62451171875, -0.2056884765625, 0.213134765625, 0.6319580078125, 1.05078125, 1.4696044921875, 1.888427734375, 2.3072509765625, 2.72607421875, 3.1448974609375, 3.563720703125, 3.9825439453125, 4.4013671875, 4.8201904296875, 5.239013671875, 5.6578369140625, 6.07666015625, 6.4954833984375, 6.914306640625, 7.3331298828125, 7.751953125, 8.1707763671875, 8.589599609375, 9.0084228515625, 9.42724609375, 9.8460693359375, 10.264892578125, 10.6837158203125, 11.1025390625, 11.5213623046875, 11.940185546875, 12.3590087890625, 12.77783203125, 13.1966552734375, 13.615478515625, 14.0343017578125, 14.453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 2.0, 8.0, 6.0, 8.0, 10.0, 14.0, 15.0, 22.0, 19.0, 36.0, 26.0, 31.0, 38.0, 42.0, 34.0, 41.0, 50.0, 47.0, 32.0, 50.0, 59.0, 41.0, 45.0, 59.0, 33.0, 32.0, 24.0, 36.0, 22.0, 27.0, 20.0, 12.0, 8.0, 17.0, 10.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.25, -5.096435546875, -4.94287109375, -4.789306640625, -4.6357421875, -4.482177734375, -4.32861328125, -4.175048828125, -4.021484375, -3.867919921875, -3.71435546875, -3.560791015625, -3.4072265625, -3.253662109375, -3.10009765625, -2.946533203125, -2.79296875, -2.639404296875, -2.48583984375, -2.332275390625, -2.1787109375, -2.025146484375, -1.87158203125, -1.718017578125, -1.564453125, -1.410888671875, -1.25732421875, -1.103759765625, -0.9501953125, -0.796630859375, -0.64306640625, -0.489501953125, -0.3359375, -0.182373046875, -0.02880859375, 0.124755859375, 0.2783203125, 0.431884765625, 0.58544921875, 0.739013671875, 0.892578125, 1.046142578125, 1.19970703125, 1.353271484375, 1.5068359375, 1.660400390625, 1.81396484375, 1.967529296875, 2.12109375, 2.274658203125, 2.42822265625, 2.581787109375, 2.7353515625, 2.888916015625, 3.04248046875, 3.196044921875, 3.349609375, 3.503173828125, 3.65673828125, 3.810302734375, 3.9638671875, 4.117431640625, 4.27099609375, 4.424560546875, 4.578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 12.0, 12.0, 14.0, 14.0, 43.0, 36.0, 69.0, 138.0, 201.0, 454.0, 874.0, 1960.0, 5483.0, 19276.0, 110393.0, 635328.0, 228284.0, 32676.0, 8242.0, 2718.0, 1131.0, 545.0, 255.0, 145.0, 93.0, 53.0, 29.0, 20.0, 22.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.98980712890625, -7.7452392578125, -7.50067138671875, -7.256103515625, -7.01153564453125, -6.7669677734375, -6.52239990234375, -6.27783203125, -6.03326416015625, -5.7886962890625, -5.54412841796875, -5.299560546875, -5.05499267578125, -4.8104248046875, -4.56585693359375, -4.3212890625, -4.07672119140625, -3.8321533203125, -3.58758544921875, -3.343017578125, -3.09844970703125, -2.8538818359375, -2.60931396484375, -2.36474609375, -2.12017822265625, -1.8756103515625, -1.63104248046875, -1.386474609375, -1.14190673828125, -0.8973388671875, -0.65277099609375, -0.408203125, -0.16363525390625, 0.0809326171875, 0.32550048828125, 0.570068359375, 0.81463623046875, 1.0592041015625, 1.30377197265625, 1.54833984375, 1.79290771484375, 2.0374755859375, 2.28204345703125, 2.526611328125, 2.77117919921875, 3.0157470703125, 3.26031494140625, 3.5048828125, 3.74945068359375, 3.9940185546875, 4.23858642578125, 4.483154296875, 4.72772216796875, 4.9722900390625, 5.21685791015625, 5.46142578125, 5.70599365234375, 5.9505615234375, 6.19512939453125, 6.439697265625, 6.68426513671875, 6.9288330078125, 7.17340087890625, 7.41796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 7.0, 13.0, 13.0, 26.0, 22.0, 49.0, 63.0, 78.0, 88.0, 102.0, 81.0, 104.0, 83.0, 80.0, 64.0, 46.0, 17.0, 14.0, 10.0, 10.0, 8.0, 6.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010452866554260254, -0.0010129213333129883, -0.0009805560111999512, -0.0009481906890869141, -0.000915825366973877, -0.0008834600448608398, -0.0008510947227478027, -0.0008187294006347656, -0.0007863640785217285, -0.0007539987564086914, -0.0007216334342956543, -0.0006892681121826172, -0.0006569027900695801, -0.000624537467956543, -0.0005921721458435059, -0.0005598068237304688, -0.0005274415016174316, -0.0004950761795043945, -0.0004627108573913574, -0.0004303455352783203, -0.0003979802131652832, -0.0003656148910522461, -0.000333249568939209, -0.0003008842468261719, -0.00026851892471313477, -0.00023615360260009766, -0.00020378828048706055, -0.00017142295837402344, -0.00013905763626098633, -0.00010669231414794922, -7.432699203491211e-05, -4.1961669921875e-05, -9.59634780883789e-06, 2.276897430419922e-05, 5.513429641723633e-05, 8.749961853027344e-05, 0.00011986494064331055, 0.00015223026275634766, 0.00018459558486938477, 0.00021696090698242188, 0.000249326229095459, 0.0002816915512084961, 0.0003140568733215332, 0.0003464221954345703, 0.0003787875175476074, 0.00041115283966064453, 0.00044351816177368164, 0.00047588348388671875, 0.0005082488059997559, 0.000540614128112793, 0.0005729794502258301, 0.0006053447723388672, 0.0006377100944519043, 0.0006700754165649414, 0.0007024407386779785, 0.0007348060607910156, 0.0007671713829040527, 0.0007995367050170898, 0.000831902027130127, 0.0008642673492431641, 0.0008966326713562012, 0.0009289979934692383, 0.0009613633155822754, 0.0009937286376953125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 9.0, 4.0, 9.0, 11.0, 13.0, 17.0, 17.0, 33.0, 51.0, 80.0, 113.0, 186.0, 354.0, 621.0, 1338.0, 3081.0, 10106.0, 47241.0, 422805.0, 490705.0, 54055.0, 11329.0, 3333.0, 1339.0, 677.0, 363.0, 231.0, 137.0, 84.0, 67.0, 45.0, 19.0, 22.0, 9.0, 10.0, 11.0, 9.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.08984375, -6.85382080078125, -6.6177978515625, -6.38177490234375, -6.145751953125, -5.90972900390625, -5.6737060546875, -5.43768310546875, -5.20166015625, -4.96563720703125, -4.7296142578125, -4.49359130859375, -4.257568359375, -4.02154541015625, -3.7855224609375, -3.54949951171875, -3.3134765625, -3.07745361328125, -2.8414306640625, -2.60540771484375, -2.369384765625, -2.13336181640625, -1.8973388671875, -1.66131591796875, -1.42529296875, -1.18927001953125, -0.9532470703125, -0.71722412109375, -0.481201171875, -0.24517822265625, -0.0091552734375, 0.22686767578125, 0.462890625, 0.69891357421875, 0.9349365234375, 1.17095947265625, 1.406982421875, 1.64300537109375, 1.8790283203125, 2.11505126953125, 2.35107421875, 2.58709716796875, 2.8231201171875, 3.05914306640625, 3.295166015625, 3.53118896484375, 3.7672119140625, 4.00323486328125, 4.2392578125, 4.47528076171875, 4.7113037109375, 4.94732666015625, 5.183349609375, 5.41937255859375, 5.6553955078125, 5.89141845703125, 6.12744140625, 6.36346435546875, 6.5994873046875, 6.83551025390625, 7.071533203125, 7.30755615234375, 7.5435791015625, 7.77960205078125, 8.015625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 4.0, 5.0, 7.0, 7.0, 8.0, 10.0, 14.0, 14.0, 19.0, 18.0, 30.0, 33.0, 44.0, 55.0, 49.0, 65.0, 94.0, 74.0, 63.0, 51.0, 59.0, 51.0, 38.0, 23.0, 31.0, 30.0, 16.0, 9.0, 8.0, 12.0, 8.0, 9.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.095245361328125, -2.98931884765625, -2.883392333984375, -2.7774658203125, -2.671539306640625, -2.56561279296875, -2.459686279296875, -2.353759765625, -2.247833251953125, -2.14190673828125, -2.035980224609375, -1.9300537109375, -1.824127197265625, -1.71820068359375, -1.612274169921875, -1.50634765625, -1.400421142578125, -1.29449462890625, -1.188568115234375, -1.0826416015625, -0.976715087890625, -0.87078857421875, -0.764862060546875, -0.658935546875, -0.553009033203125, -0.44708251953125, -0.341156005859375, -0.2352294921875, -0.129302978515625, -0.02337646484375, 0.082550048828125, 0.1884765625, 0.294403076171875, 0.40032958984375, 0.506256103515625, 0.6121826171875, 0.718109130859375, 0.82403564453125, 0.929962158203125, 1.035888671875, 1.141815185546875, 1.24774169921875, 1.353668212890625, 1.4595947265625, 1.565521240234375, 1.67144775390625, 1.777374267578125, 1.88330078125, 1.989227294921875, 2.09515380859375, 2.201080322265625, 2.3070068359375, 2.412933349609375, 2.51885986328125, 2.624786376953125, 2.730712890625, 2.836639404296875, 2.94256591796875, 3.048492431640625, 3.1544189453125, 3.260345458984375, 3.36627197265625, 3.472198486328125, 3.578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 7.0, 8.0, 28.0, 64.0, 104.0, 186.0, 215.0, 189.0, 98.0, 53.0, 22.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.53807830810547, -87.35637664794922, -84.17467498779297, -80.99297332763672, -77.81127166748047, -74.62957000732422, -71.4478759765625, -68.26617431640625, -65.08447265625, -61.90277099609375, -58.7210693359375, -55.53936767578125, -52.357666015625, -49.17596435546875, -45.994266510009766, -42.812564849853516, -39.630859375, -36.44915771484375, -33.2674560546875, -30.085756301879883, -26.904054641723633, -23.722352981567383, -20.540653228759766, -17.358951568603516, -14.177249908447266, -10.995548248291016, -7.813847541809082, -4.632146835327148, -1.4504451751708984, 1.7312564849853516, 4.912956237792969, 8.094657897949219, 11.2763671875, 14.45806884765625, 17.6397705078125, 20.821470260620117, 24.003171920776367, 27.184873580932617, 30.366573333740234, 33.548274993896484, 36.729976654052734, 39.911678314208984, 43.093379974365234, 46.27507781982422, 49.45677947998047, 52.63848114013672, 55.82018280029297, 59.00188446044922, 62.18358612060547, 65.36528778076172, 68.54698944091797, 71.72869110107422, 74.91039276123047, 78.09209442138672, 81.27378845214844, 84.45549011230469, 87.63719177246094, 90.81889343261719, 94.00059509277344, 97.18229675292969, 100.36399841308594, 103.54570007324219, 106.72740173339844, 109.90910339355469, 113.09080505371094]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 8.0, 12.0, 10.0, 15.0, 14.0, 31.0, 18.0, 46.0, 37.0, 43.0, 44.0, 53.0, 46.0, 47.0, 69.0, 51.0, 71.0, 48.0, 41.0, 39.0, 42.0, 41.0, 28.0, 29.0, 22.0, 23.0, 16.0, 12.0, 15.0, 9.0, 9.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.32777786254883, -42.214908599853516, -41.10203552246094, -39.989166259765625, -38.87629699707031, -37.763427734375, -36.65055465698242, -35.53768539428711, -34.42481231689453, -33.31194305419922, -32.19906997680664, -31.086200714111328, -29.973331451416016, -28.86046028137207, -27.747589111328125, -26.634719848632812, -25.5218505859375, -24.408979415893555, -23.296110153198242, -22.183238983154297, -21.070369720458984, -19.95749855041504, -18.844627380371094, -17.73175811767578, -16.618886947631836, -15.506016731262207, -14.393146514892578, -13.280275344848633, -12.167405128479004, -11.054534912109375, -9.94166374206543, -8.8287935256958, -7.715923309326172, -6.603053092956543, -5.490182399749756, -4.377311706542969, -3.26444149017334, -2.151571273803711, -1.0387005805969238, 0.07417011260986328, 1.1870403289794922, 2.2999107837677, 3.412781238555908, 4.525651931762695, 5.638522148132324, 6.751392364501953, 7.86426305770874, 8.977133750915527, 10.090003967285156, 11.202874183654785, 12.315744400024414, 13.42861557006836, 14.541485786437988, 15.654356002807617, 16.767227172851562, 17.880096435546875, 18.99296760559082, 20.105838775634766, 21.218708038330078, 22.331579208374023, 23.44445037841797, 24.55731964111328, 25.670190811157227, 26.783061981201172, 27.895931243896484]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 16.0, 15.0, 17.0, 29.0, 51.0, 70.0, 135.0, 213.0, 544.0, 1508.0, 5420.0, 36115.0, 3443091.0, 677403.0, 23130.0, 4132.0, 1247.0, 492.0, 227.0, 135.0, 97.0, 45.0, 29.0, 27.0, 11.0, 8.0, 17.0, 10.0, 9.0, 5.0, 1.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.28125, -20.459716796875, -19.63818359375, -18.816650390625, -17.9951171875, -17.173583984375, -16.35205078125, -15.530517578125, -14.708984375, -13.887451171875, -13.06591796875, -12.244384765625, -11.4228515625, -10.601318359375, -9.77978515625, -8.958251953125, -8.13671875, -7.315185546875, -6.49365234375, -5.672119140625, -4.8505859375, -4.029052734375, -3.20751953125, -2.385986328125, -1.564453125, -0.742919921875, 0.07861328125, 0.900146484375, 1.7216796875, 2.543212890625, 3.36474609375, 4.186279296875, 5.0078125, 5.829345703125, 6.65087890625, 7.472412109375, 8.2939453125, 9.115478515625, 9.93701171875, 10.758544921875, 11.580078125, 12.401611328125, 13.22314453125, 14.044677734375, 14.8662109375, 15.687744140625, 16.50927734375, 17.330810546875, 18.15234375, 18.973876953125, 19.79541015625, 20.616943359375, 21.4384765625, 22.260009765625, 23.08154296875, 23.903076171875, 24.724609375, 25.546142578125, 26.36767578125, 27.189208984375, 28.0107421875, 28.832275390625, 29.65380859375, 30.475341796875, 31.296875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 1.0, 6.0, 4.0, 10.0, 20.0, 28.0, 41.0, 65.0, 82.0, 110.0, 107.0, 114.0, 107.0, 84.0, 78.0, 56.0, 36.0, 27.0, 11.0, 10.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1787109375, -1.1099090576171875, -1.041107177734375, -0.9723052978515625, -0.90350341796875, -0.8347015380859375, -0.765899658203125, -0.6970977783203125, -0.6282958984375, -0.5594940185546875, -0.490692138671875, -0.4218902587890625, -0.35308837890625, -0.2842864990234375, -0.215484619140625, -0.1466827392578125, -0.077880859375, -0.0090789794921875, 0.059722900390625, 0.1285247802734375, 0.19732666015625, 0.2661285400390625, 0.334930419921875, 0.4037322998046875, 0.4725341796875, 0.5413360595703125, 0.610137939453125, 0.6789398193359375, 0.74774169921875, 0.8165435791015625, 0.885345458984375, 0.9541473388671875, 1.02294921875, 1.0917510986328125, 1.160552978515625, 1.2293548583984375, 1.29815673828125, 1.3669586181640625, 1.435760498046875, 1.5045623779296875, 1.5733642578125, 1.6421661376953125, 1.710968017578125, 1.7797698974609375, 1.84857177734375, 1.9173736572265625, 1.986175537109375, 2.0549774169921875, 2.123779296875, 2.1925811767578125, 2.261383056640625, 2.3301849365234375, 2.39898681640625, 2.4677886962890625, 2.536590576171875, 2.6053924560546875, 2.6741943359375, 2.7429962158203125, 2.811798095703125, 2.8805999755859375, 2.94940185546875, 3.0182037353515625, 3.087005615234375, 3.1558074951171875, 3.224609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 11.0, 12.0, 24.0, 39.0, 76.0, 133.0, 395.0, 9278.0, 4182628.0, 1155.0, 203.0, 107.0, 57.0, 53.0, 41.0, 26.0, 12.0, 13.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.625, -106.615234375, -101.60546875, -96.595703125, -91.5859375, -86.576171875, -81.56640625, -76.556640625, -71.546875, -66.537109375, -61.52734375, -56.517578125, -51.5078125, -46.498046875, -41.48828125, -36.478515625, -31.46875, -26.458984375, -21.44921875, -16.439453125, -11.4296875, -6.419921875, -1.41015625, 3.599609375, 8.609375, 13.619140625, 18.62890625, 23.638671875, 28.6484375, 33.658203125, 38.66796875, 43.677734375, 48.6875, 53.697265625, 58.70703125, 63.716796875, 68.7265625, 73.736328125, 78.74609375, 83.755859375, 88.765625, 93.775390625, 98.78515625, 103.794921875, 108.8046875, 113.814453125, 118.82421875, 123.833984375, 128.84375, 133.853515625, 138.86328125, 143.873046875, 148.8828125, 153.892578125, 158.90234375, 163.912109375, 168.921875, 173.931640625, 178.94140625, 183.951171875, 188.9609375, 193.970703125, 198.98046875, 203.990234375, 209.0]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 11.0, 84.0, 837.0, 2980.0, 145.0, 16.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8515625, -9.2769775390625, -8.702392578125, -8.1278076171875, -7.55322265625, -6.9786376953125, -6.404052734375, -5.8294677734375, -5.2548828125, -4.6802978515625, -4.105712890625, -3.5311279296875, -2.95654296875, -2.3819580078125, -1.807373046875, -1.2327880859375, -0.658203125, -0.0836181640625, 0.490966796875, 1.0655517578125, 1.64013671875, 2.2147216796875, 2.789306640625, 3.3638916015625, 3.9384765625, 4.5130615234375, 5.087646484375, 5.6622314453125, 6.23681640625, 6.8114013671875, 7.385986328125, 7.9605712890625, 8.53515625, 9.1097412109375, 9.684326171875, 10.2589111328125, 10.83349609375, 11.4080810546875, 11.982666015625, 12.5572509765625, 13.1318359375, 13.7064208984375, 14.281005859375, 14.8555908203125, 15.43017578125, 16.0047607421875, 16.579345703125, 17.1539306640625, 17.728515625, 18.3031005859375, 18.877685546875, 19.4522705078125, 20.02685546875, 20.6014404296875, 21.176025390625, 21.7506103515625, 22.3251953125, 22.8997802734375, 23.474365234375, 24.0489501953125, 24.62353515625, 25.1981201171875, 25.772705078125, 26.3472900390625, 26.921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 14.0, 729.0, 258.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-465.19134521484375, -455.4664001464844, -445.7414855957031, -436.01654052734375, -426.2915954589844, -416.566650390625, -406.84173583984375, -397.1167907714844, -387.391845703125, -377.6669006347656, -367.9419860839844, -358.217041015625, -348.4920959472656, -338.76715087890625, -329.042236328125, -319.3172912597656, -309.5923767089844, -299.867431640625, -290.14251708984375, -280.4175720214844, -270.692626953125, -260.96771240234375, -251.24276733398438, -241.517822265625, -231.7928924560547, -222.06796264648438, -212.343017578125, -202.6180877685547, -192.89315795898438, -183.168212890625, -173.4432830810547, -163.71835327148438, -153.993408203125, -144.2684783935547, -134.5435333251953, -124.818603515625, -115.09366607666016, -105.36872863769531, -95.643798828125, -85.91886138916016, -76.19392395019531, -66.46898651123047, -56.74405288696289, -47.01911926269531, -37.29418182373047, -27.569244384765625, -17.844310760498047, -8.119377136230469, 1.605560302734375, 11.330495834350586, 21.055431365966797, 30.780366897583008, 40.50530242919922, 50.23023986816406, 59.95517349243164, 69.68010711669922, 79.40504455566406, 89.1299819946289, 98.85491943359375, 108.57984924316406, 118.3047866821289, 128.02972412109375, 137.75465393066406, 147.47958374023438, 157.20452880859375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 10.0, 24.0, 37.0, 65.0, 87.0, 114.0, 133.0, 138.0, 133.0, 102.0, 72.0, 46.0, 17.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.88655090332031, -44.566627502441406, -43.246700286865234, -41.92677307128906, -40.606849670410156, -39.28692626953125, -37.96699905395508, -36.647071838378906, -35.3271484375, -34.007225036621094, -32.68729782104492, -31.367372512817383, -30.047447204589844, -28.727521896362305, -27.407596588134766, -26.087671279907227, -24.767745971679688, -23.44782066345215, -22.12789535522461, -20.80797004699707, -19.48804473876953, -18.168119430541992, -16.848194122314453, -15.528268814086914, -14.208343505859375, -12.888418197631836, -11.568492889404297, -10.248567581176758, -8.928642272949219, -7.60871696472168, -6.288791656494141, -4.968866348266602, -3.6489410400390625, -2.3290157318115234, -1.0090904235839844, 0.3108348846435547, 1.6307601928710938, 2.950685501098633, 4.270610809326172, 5.590536117553711, 6.91046142578125, 8.230386734008789, 9.550312042236328, 10.870237350463867, 12.190162658691406, 13.510087966918945, 14.830013275146484, 16.149938583374023, 17.469863891601562, 18.7897891998291, 20.10971450805664, 21.42963981628418, 22.74956512451172, 24.069490432739258, 25.389415740966797, 26.709341049194336, 28.029266357421875, 29.349191665649414, 30.669116973876953, 31.989042282104492, 33.30896759033203, 34.62889099121094, 35.94881820678711, 37.26874542236328, 38.58866882324219]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 7.0, 12.0, 11.0, 13.0, 17.0, 23.0, 21.0, 43.0, 55.0, 58.0, 93.0, 147.0, 291.0, 580.0, 1477.0, 5768.0, 34023.0, 288166.0, 608503.0, 91744.0, 12846.0, 2778.0, 880.0, 377.0, 193.0, 113.0, 94.0, 49.0, 38.0, 28.0, 21.0, 18.0, 14.0, 11.0, 8.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.796875, -20.109130859375, -19.42138671875, -18.733642578125, -18.0458984375, -17.358154296875, -16.67041015625, -15.982666015625, -15.294921875, -14.607177734375, -13.91943359375, -13.231689453125, -12.5439453125, -11.856201171875, -11.16845703125, -10.480712890625, -9.79296875, -9.105224609375, -8.41748046875, -7.729736328125, -7.0419921875, -6.354248046875, -5.66650390625, -4.978759765625, -4.291015625, -3.603271484375, -2.91552734375, -2.227783203125, -1.5400390625, -0.852294921875, -0.16455078125, 0.523193359375, 1.2109375, 1.898681640625, 2.58642578125, 3.274169921875, 3.9619140625, 4.649658203125, 5.33740234375, 6.025146484375, 6.712890625, 7.400634765625, 8.08837890625, 8.776123046875, 9.4638671875, 10.151611328125, 10.83935546875, 11.527099609375, 12.21484375, 12.902587890625, 13.59033203125, 14.278076171875, 14.9658203125, 15.653564453125, 16.34130859375, 17.029052734375, 17.716796875, 18.404541015625, 19.09228515625, 19.780029296875, 20.4677734375, 21.155517578125, 21.84326171875, 22.531005859375, 23.21875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 3.0, 6.0, 12.0, 18.0, 43.0, 51.0, 68.0, 96.0, 117.0, 131.0, 144.0, 88.0, 87.0, 58.0, 37.0, 21.0, 13.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.58203125, -1.4920654296875, -1.402099609375, -1.3121337890625, -1.22216796875, -1.1322021484375, -1.042236328125, -0.9522705078125, -0.8623046875, -0.7723388671875, -0.682373046875, -0.5924072265625, -0.50244140625, -0.4124755859375, -0.322509765625, -0.2325439453125, -0.142578125, -0.0526123046875, 0.037353515625, 0.1273193359375, 0.21728515625, 0.3072509765625, 0.397216796875, 0.4871826171875, 0.5771484375, 0.6671142578125, 0.757080078125, 0.8470458984375, 0.93701171875, 1.0269775390625, 1.116943359375, 1.2069091796875, 1.296875, 1.3868408203125, 1.476806640625, 1.5667724609375, 1.65673828125, 1.7467041015625, 1.836669921875, 1.9266357421875, 2.0166015625, 2.1065673828125, 2.196533203125, 2.2864990234375, 2.37646484375, 2.4664306640625, 2.556396484375, 2.6463623046875, 2.736328125, 2.8262939453125, 2.916259765625, 3.0062255859375, 3.09619140625, 3.1861572265625, 3.276123046875, 3.3660888671875, 3.4560546875, 3.5460205078125, 3.635986328125, 3.7259521484375, 3.81591796875, 3.9058837890625, 3.995849609375, 4.0858154296875, 4.17578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 4.0, 11.0, 8.0, 10.0, 21.0, 19.0, 23.0, 44.0, 66.0, 79.0, 101.0, 152.0, 201.0, 306.0, 466.0, 737.0, 1122.0, 2093.0, 3604.0, 7378.0, 18442.0, 58119.0, 212561.0, 443246.0, 208799.0, 56549.0, 18026.0, 7294.0, 3699.0, 1890.0, 1168.0, 752.0, 459.0, 319.0, 219.0, 161.0, 95.0, 73.0, 57.0, 43.0, 39.0, 21.0, 13.0, 13.0, 10.0, 10.0, 4.0, 2.0, 8.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0], "bins": [-10.8125, -10.4578857421875, -10.103271484375, -9.7486572265625, -9.39404296875, -9.0394287109375, -8.684814453125, -8.3302001953125, -7.9755859375, -7.6209716796875, -7.266357421875, -6.9117431640625, -6.55712890625, -6.2025146484375, -5.847900390625, -5.4932861328125, -5.138671875, -4.7840576171875, -4.429443359375, -4.0748291015625, -3.72021484375, -3.3656005859375, -3.010986328125, -2.6563720703125, -2.3017578125, -1.9471435546875, -1.592529296875, -1.2379150390625, -0.88330078125, -0.5286865234375, -0.174072265625, 0.1805419921875, 0.53515625, 0.8897705078125, 1.244384765625, 1.5989990234375, 1.95361328125, 2.3082275390625, 2.662841796875, 3.0174560546875, 3.3720703125, 3.7266845703125, 4.081298828125, 4.4359130859375, 4.79052734375, 5.1451416015625, 5.499755859375, 5.8543701171875, 6.208984375, 6.5635986328125, 6.918212890625, 7.2728271484375, 7.62744140625, 7.9820556640625, 8.336669921875, 8.6912841796875, 9.0458984375, 9.4005126953125, 9.755126953125, 10.1097412109375, 10.46435546875, 10.8189697265625, 11.173583984375, 11.5281982421875, 11.8828125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 8.0, 1.0, 9.0, 6.0, 16.0, 15.0, 18.0, 21.0, 21.0, 34.0, 24.0, 29.0, 45.0, 31.0, 38.0, 56.0, 42.0, 53.0, 48.0, 46.0, 51.0, 52.0, 37.0, 43.0, 43.0, 37.0, 28.0, 24.0, 19.0, 20.0, 28.0, 8.0, 13.0, 13.0, 9.0, 7.0, 5.0, 2.0, 1.0, 7.0, 0.0, 1.0, 3.0], "bins": [-7.6875, -7.49310302734375, -7.2987060546875, -7.10430908203125, -6.909912109375, -6.71551513671875, -6.5211181640625, -6.32672119140625, -6.13232421875, -5.93792724609375, -5.7435302734375, -5.54913330078125, -5.354736328125, -5.16033935546875, -4.9659423828125, -4.77154541015625, -4.5771484375, -4.38275146484375, -4.1883544921875, -3.99395751953125, -3.799560546875, -3.60516357421875, -3.4107666015625, -3.21636962890625, -3.02197265625, -2.82757568359375, -2.6331787109375, -2.43878173828125, -2.244384765625, -2.04998779296875, -1.8555908203125, -1.66119384765625, -1.466796875, -1.27239990234375, -1.0780029296875, -0.88360595703125, -0.689208984375, -0.49481201171875, -0.3004150390625, -0.10601806640625, 0.08837890625, 0.28277587890625, 0.4771728515625, 0.67156982421875, 0.865966796875, 1.06036376953125, 1.2547607421875, 1.44915771484375, 1.6435546875, 1.83795166015625, 2.0323486328125, 2.22674560546875, 2.421142578125, 2.61553955078125, 2.8099365234375, 3.00433349609375, 3.19873046875, 3.39312744140625, 3.5875244140625, 3.78192138671875, 3.976318359375, 4.17071533203125, 4.3651123046875, 4.55950927734375, 4.75390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 13.0, 15.0, 7.0, 26.0, 27.0, 48.0, 65.0, 129.0, 253.0, 533.0, 1315.0, 4615.0, 28121.0, 763394.0, 232425.0, 13011.0, 2729.0, 935.0, 401.0, 212.0, 106.0, 70.0, 32.0, 28.0, 15.0, 14.0, 11.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3828125, -12.9017333984375, -12.420654296875, -11.9395751953125, -11.45849609375, -10.9774169921875, -10.496337890625, -10.0152587890625, -9.5341796875, -9.0531005859375, -8.572021484375, -8.0909423828125, -7.60986328125, -7.1287841796875, -6.647705078125, -6.1666259765625, -5.685546875, -5.2044677734375, -4.723388671875, -4.2423095703125, -3.76123046875, -3.2801513671875, -2.799072265625, -2.3179931640625, -1.8369140625, -1.3558349609375, -0.874755859375, -0.3936767578125, 0.08740234375, 0.5684814453125, 1.049560546875, 1.5306396484375, 2.01171875, 2.4927978515625, 2.973876953125, 3.4549560546875, 3.93603515625, 4.4171142578125, 4.898193359375, 5.3792724609375, 5.8603515625, 6.3414306640625, 6.822509765625, 7.3035888671875, 7.78466796875, 8.2657470703125, 8.746826171875, 9.2279052734375, 9.708984375, 10.1900634765625, 10.671142578125, 11.1522216796875, 11.63330078125, 12.1143798828125, 12.595458984375, 13.0765380859375, 13.5576171875, 14.0386962890625, 14.519775390625, 15.0008544921875, 15.48193359375, 15.9630126953125, 16.444091796875, 16.9251708984375, 17.40625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 23.0, 51.0, 91.0, 166.0, 222.0, 188.0, 119.0, 63.0, 30.0, 15.0, 8.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022602081298828125, -0.002181708812713623, -0.0021032094955444336, -0.002024710178375244, -0.0019462108612060547, -0.0018677115440368652, -0.0017892122268676758, -0.0017107129096984863, -0.0016322135925292969, -0.0015537142753601074, -0.001475214958190918, -0.0013967156410217285, -0.001318216323852539, -0.0012397170066833496, -0.0011612176895141602, -0.0010827183723449707, -0.0010042190551757812, -0.0009257197380065918, -0.0008472204208374023, -0.0007687211036682129, -0.0006902217864990234, -0.000611722469329834, -0.0005332231521606445, -0.0004547238349914551, -0.0003762245178222656, -0.00029772520065307617, -0.00021922588348388672, -0.00014072656631469727, -6.222724914550781e-05, 1.627206802368164e-05, 9.47713851928711e-05, 0.00017327070236206055, 0.00025177001953125, 0.00033026933670043945, 0.0004087686538696289, 0.00048726797103881836, 0.0005657672882080078, 0.0006442666053771973, 0.0007227659225463867, 0.0008012652397155762, 0.0008797645568847656, 0.0009582638740539551, 0.0010367631912231445, 0.001115262508392334, 0.0011937618255615234, 0.0012722611427307129, 0.0013507604598999023, 0.0014292597770690918, 0.0015077590942382812, 0.0015862584114074707, 0.0016647577285766602, 0.0017432570457458496, 0.001821756362915039, 0.0019002556800842285, 0.001978754997253418, 0.0020572543144226074, 0.002135753631591797, 0.0022142529487609863, 0.0022927522659301758, 0.0023712515830993652, 0.0024497509002685547, 0.002528250217437744, 0.0026067495346069336, 0.002685248851776123, 0.0027637481689453125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 9.0, 6.0, 9.0, 18.0, 25.0, 40.0, 58.0, 74.0, 162.0, 264.0, 580.0, 1205.0, 3371.0, 14469.0, 173898.0, 784003.0, 58443.0, 7896.0, 2103.0, 902.0, 437.0, 194.0, 127.0, 73.0, 48.0, 42.0, 29.0, 14.0, 15.0, 11.0, 5.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.1015625, -8.7801513671875, -8.458740234375, -8.1373291015625, -7.81591796875, -7.4945068359375, -7.173095703125, -6.8516845703125, -6.5302734375, -6.2088623046875, -5.887451171875, -5.5660400390625, -5.24462890625, -4.9232177734375, -4.601806640625, -4.2803955078125, -3.958984375, -3.6375732421875, -3.316162109375, -2.9947509765625, -2.67333984375, -2.3519287109375, -2.030517578125, -1.7091064453125, -1.3876953125, -1.0662841796875, -0.744873046875, -0.4234619140625, -0.10205078125, 0.2193603515625, 0.540771484375, 0.8621826171875, 1.18359375, 1.5050048828125, 1.826416015625, 2.1478271484375, 2.46923828125, 2.7906494140625, 3.112060546875, 3.4334716796875, 3.7548828125, 4.0762939453125, 4.397705078125, 4.7191162109375, 5.04052734375, 5.3619384765625, 5.683349609375, 6.0047607421875, 6.326171875, 6.6475830078125, 6.968994140625, 7.2904052734375, 7.61181640625, 7.9332275390625, 8.254638671875, 8.5760498046875, 8.8974609375, 9.2188720703125, 9.540283203125, 9.8616943359375, 10.18310546875, 10.5045166015625, 10.825927734375, 11.1473388671875, 11.46875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 8.0, 2.0, 5.0, 10.0, 6.0, 15.0, 19.0, 18.0, 24.0, 34.0, 59.0, 57.0, 102.0, 122.0, 114.0, 97.0, 72.0, 52.0, 55.0, 32.0, 18.0, 21.0, 11.0, 12.0, 5.0, 8.0, 4.0, 3.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.6796875, -5.50836181640625, -5.3370361328125, -5.16571044921875, -4.994384765625, -4.82305908203125, -4.6517333984375, -4.48040771484375, -4.30908203125, -4.13775634765625, -3.9664306640625, -3.79510498046875, -3.623779296875, -3.45245361328125, -3.2811279296875, -3.10980224609375, -2.9384765625, -2.76715087890625, -2.5958251953125, -2.42449951171875, -2.253173828125, -2.08184814453125, -1.9105224609375, -1.73919677734375, -1.56787109375, -1.39654541015625, -1.2252197265625, -1.05389404296875, -0.882568359375, -0.71124267578125, -0.5399169921875, -0.36859130859375, -0.197265625, -0.02593994140625, 0.1453857421875, 0.31671142578125, 0.488037109375, 0.65936279296875, 0.8306884765625, 1.00201416015625, 1.17333984375, 1.34466552734375, 1.5159912109375, 1.68731689453125, 1.858642578125, 2.02996826171875, 2.2012939453125, 2.37261962890625, 2.5439453125, 2.71527099609375, 2.8865966796875, 3.05792236328125, 3.229248046875, 3.40057373046875, 3.5718994140625, 3.74322509765625, 3.91455078125, 4.08587646484375, 4.2572021484375, 4.42852783203125, 4.599853515625, 4.77117919921875, 4.9425048828125, 5.11383056640625, 5.28515625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 9.0, 8.0, 18.0, 51.0, 236.0, 398.0, 202.0, 61.0, 9.0, 10.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-321.8060302734375, -314.737548828125, -307.6690368652344, -300.6005554199219, -293.53204345703125, -286.46356201171875, -279.3950500488281, -272.3265686035156, -265.258056640625, -258.1895751953125, -251.12106323242188, -244.0525665283203, -236.98406982421875, -229.91558837890625, -222.84707641601562, -215.77859497070312, -208.71011352539062, -201.64161682128906, -194.5731201171875, -187.50462341308594, -180.43612670898438, -173.36764526367188, -166.29913330078125, -159.23065185546875, -152.16213989257812, -145.09364318847656, -138.025146484375, -130.95664978027344, -123.8881607055664, -116.81966400146484, -109.75116729736328, -102.68267822265625, -95.61418151855469, -88.54568481445312, -81.47718811035156, -74.40869140625, -67.34020233154297, -60.271705627441406, -53.203208923339844, -46.13471603393555, -39.066219329833984, -31.997724533081055, -24.929229736328125, -17.860733032226562, -10.792238235473633, -3.723743438720703, 3.3447532653808594, 10.413246154785156, 17.48174285888672, 24.55023765563965, 31.618732452392578, 38.68722915649414, 45.75572204589844, 52.82421875, 59.89271545410156, 66.96121215820312, 74.02970886230469, 81.09820556640625, 88.16670227050781, 95.23519897460938, 102.3036880493164, 109.37218475341797, 116.44068145751953, 123.50917053222656, 130.57766723632812]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 7.0, 5.0, 8.0, 6.0, 6.0, 13.0, 22.0, 25.0, 23.0, 36.0, 41.0, 57.0, 61.0, 50.0, 65.0, 62.0, 64.0, 72.0, 56.0, 66.0, 48.0, 54.0, 31.0, 29.0, 24.0, 17.0, 21.0, 13.0, 5.0, 5.0, 8.0, 3.0, 5.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.91390609741211, -28.359495162963867, -26.805084228515625, -25.250673294067383, -23.69626235961914, -22.1418514251709, -20.587440490722656, -19.033029556274414, -17.478618621826172, -15.92420768737793, -14.369796752929688, -12.815385818481445, -11.260974884033203, -9.706563949584961, -8.152153015136719, -6.597742080688477, -5.043331146240234, -3.488920211791992, -1.93450927734375, -0.3800983428955078, 1.1743125915527344, 2.7287235260009766, 4.283134460449219, 5.837545394897461, 7.391956329345703, 8.946367263793945, 10.500778198242188, 12.05518913269043, 13.609600067138672, 15.164011001586914, 16.718421936035156, 18.2728328704834, 19.827239990234375, 21.381650924682617, 22.93606185913086, 24.4904727935791, 26.044883728027344, 27.599294662475586, 29.153705596923828, 30.70811653137207, 32.26252746582031, 33.81694030761719, 35.3713493347168, 36.925758361816406, 38.48017120361328, 40.034584045410156, 41.588993072509766, 43.143402099609375, 44.69781494140625, 46.252227783203125, 47.806636810302734, 49.361045837402344, 50.91545867919922, 52.469871520996094, 54.0242805480957, 55.57868957519531, 57.13310241699219, 58.68751525878906, 60.24192428588867, 61.79633331298828, 63.350746154785156, 64.90515899658203, 66.45956420898438, 68.01397705078125, 69.56838989257812]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 13.0, 10.0, 29.0, 36.0, 71.0, 141.0, 353.0, 1084.0, 4017.0, 21218.0, 348811.0, 3736339.0, 69912.0, 8674.0, 2060.0, 717.0, 314.0, 155.0, 106.0, 52.0, 29.0, 39.0, 29.0, 13.0, 19.0, 9.0, 6.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.492919921875, -14.59521484375, -13.697509765625, -12.7998046875, -11.902099609375, -11.00439453125, -10.106689453125, -9.208984375, -8.311279296875, -7.41357421875, -6.515869140625, -5.6181640625, -4.720458984375, -3.82275390625, -2.925048828125, -2.02734375, -1.129638671875, -0.23193359375, 0.665771484375, 1.5634765625, 2.461181640625, 3.35888671875, 4.256591796875, 5.154296875, 6.052001953125, 6.94970703125, 7.847412109375, 8.7451171875, 9.642822265625, 10.54052734375, 11.438232421875, 12.3359375, 13.233642578125, 14.13134765625, 15.029052734375, 15.9267578125, 16.824462890625, 17.72216796875, 18.619873046875, 19.517578125, 20.415283203125, 21.31298828125, 22.210693359375, 23.1083984375, 24.006103515625, 24.90380859375, 25.801513671875, 26.69921875, 27.596923828125, 28.49462890625, 29.392333984375, 30.2900390625, 31.187744140625, 32.08544921875, 32.983154296875, 33.880859375, 34.778564453125, 35.67626953125, 36.573974609375, 37.4716796875, 38.369384765625, 39.26708984375, 40.164794921875, 41.0625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 11.0, 20.0, 40.0, 58.0, 79.0, 105.0, 133.0, 134.0, 140.0, 88.0, 75.0, 41.0, 30.0, 25.0, 16.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8720703125, -1.7754974365234375, -1.678924560546875, -1.5823516845703125, -1.48577880859375, -1.3892059326171875, -1.292633056640625, -1.1960601806640625, -1.0994873046875, -1.0029144287109375, -0.906341552734375, -0.8097686767578125, -0.71319580078125, -0.6166229248046875, -0.520050048828125, -0.4234771728515625, -0.326904296875, -0.2303314208984375, -0.133758544921875, -0.0371856689453125, 0.05938720703125, 0.1559600830078125, 0.252532958984375, 0.3491058349609375, 0.4456787109375, 0.5422515869140625, 0.638824462890625, 0.7353973388671875, 0.83197021484375, 0.9285430908203125, 1.025115966796875, 1.1216888427734375, 1.21826171875, 1.3148345947265625, 1.411407470703125, 1.5079803466796875, 1.60455322265625, 1.7011260986328125, 1.797698974609375, 1.8942718505859375, 1.9908447265625, 2.0874176025390625, 2.183990478515625, 2.2805633544921875, 2.37713623046875, 2.4737091064453125, 2.570281982421875, 2.6668548583984375, 2.763427734375, 2.8600006103515625, 2.956573486328125, 3.0531463623046875, 3.14971923828125, 3.2462921142578125, 3.342864990234375, 3.4394378662109375, 3.5360107421875, 3.6325836181640625, 3.729156494140625, 3.8257293701171875, 3.92230224609375, 4.0188751220703125, 4.115447998046875, 4.2120208740234375, 4.30859375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 7.0, 8.0, 13.0, 21.0, 19.0, 62.0, 78.0, 126.0, 304.0, 1100.0, 7617.0, 1344472.0, 2828549.0, 9570.0, 1497.0, 393.0, 154.0, 83.0, 75.0, 48.0, 29.0, 30.0, 8.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.875, -76.80029296875, -74.7255859375, -72.65087890625, -70.576171875, -68.50146484375, -66.4267578125, -64.35205078125, -62.27734375, -60.20263671875, -58.1279296875, -56.05322265625, -53.978515625, -51.90380859375, -49.8291015625, -47.75439453125, -45.6796875, -43.60498046875, -41.5302734375, -39.45556640625, -37.380859375, -35.30615234375, -33.2314453125, -31.15673828125, -29.08203125, -27.00732421875, -24.9326171875, -22.85791015625, -20.783203125, -18.70849609375, -16.6337890625, -14.55908203125, -12.484375, -10.40966796875, -8.3349609375, -6.26025390625, -4.185546875, -2.11083984375, -0.0361328125, 2.03857421875, 4.11328125, 6.18798828125, 8.2626953125, 10.33740234375, 12.412109375, 14.48681640625, 16.5615234375, 18.63623046875, 20.7109375, 22.78564453125, 24.8603515625, 26.93505859375, 29.009765625, 31.08447265625, 33.1591796875, 35.23388671875, 37.30859375, 39.38330078125, 41.4580078125, 43.53271484375, 45.607421875, 47.68212890625, 49.7568359375, 51.83154296875, 53.90625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 10.0, 48.0, 109.0, 348.0, 2198.0, 983.0, 216.0, 78.0, 35.0, 9.0, 15.0, 10.0, 4.0, 5.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.29754638671875, -5.8411865234375, -5.38482666015625, -4.928466796875, -4.47210693359375, -4.0157470703125, -3.55938720703125, -3.10302734375, -2.64666748046875, -2.1903076171875, -1.73394775390625, -1.277587890625, -0.82122802734375, -0.3648681640625, 0.09149169921875, 0.5478515625, 1.00421142578125, 1.4605712890625, 1.91693115234375, 2.373291015625, 2.82965087890625, 3.2860107421875, 3.74237060546875, 4.19873046875, 4.65509033203125, 5.1114501953125, 5.56781005859375, 6.024169921875, 6.48052978515625, 6.9368896484375, 7.39324951171875, 7.849609375, 8.30596923828125, 8.7623291015625, 9.21868896484375, 9.675048828125, 10.13140869140625, 10.5877685546875, 11.04412841796875, 11.50048828125, 11.95684814453125, 12.4132080078125, 12.86956787109375, 13.325927734375, 13.78228759765625, 14.2386474609375, 14.69500732421875, 15.1513671875, 15.60772705078125, 16.0640869140625, 16.52044677734375, 16.976806640625, 17.43316650390625, 17.8895263671875, 18.34588623046875, 18.80224609375, 19.25860595703125, 19.7149658203125, 20.17132568359375, 20.627685546875, 21.08404541015625, 21.5404052734375, 21.99676513671875, 22.453125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 5.0, 8.0, 69.0, 287.0, 446.0, 136.0, 31.0, 11.0, 7.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.3511962890625, -96.06861877441406, -90.7860336303711, -85.50345611572266, -80.22087097167969, -74.93829345703125, -69.65571594238281, -64.37313842773438, -59.090553283691406, -53.8079719543457, -48.525390625, -43.24281311035156, -37.96023178100586, -32.677650451660156, -27.395071029663086, -22.112491607666016, -16.829910278320312, -11.547329902648926, -6.264749526977539, -0.9821691513061523, 4.300411224365234, 9.582992553710938, 14.865571975708008, 20.148151397705078, 25.43073272705078, 30.713314056396484, 35.99589538574219, 41.278472900390625, 46.56105422973633, 51.84363555908203, 57.12621307373047, 62.40879440307617, 67.69137573242188, 72.97395324707031, 78.25653839111328, 83.53911590576172, 88.82170104980469, 94.10427856445312, 99.38685607910156, 104.66943359375, 109.95201873779297, 115.2345962524414, 120.51718139648438, 125.79975891113281, 131.08233642578125, 136.36492919921875, 141.6475067138672, 146.93008422851562, 152.21266174316406, 157.4952392578125, 162.77781677246094, 168.06040954589844, 173.34298706054688, 178.6255645751953, 183.90814208984375, 189.1907196044922, 194.47329711914062, 199.75587463378906, 205.0384521484375, 210.321044921875, 215.60362243652344, 220.88619995117188, 226.1687774658203, 231.45135498046875, 236.73394775390625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 19.0, 35.0, 55.0, 95.0, 119.0, 141.0, 156.0, 114.0, 90.0, 70.0, 42.0, 33.0, 13.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.34202575683594, -66.94820404052734, -64.55438995361328, -62.16056823730469, -59.76675033569336, -57.37293243408203, -54.97911071777344, -52.58529281616211, -50.19147491455078, -47.79765701293945, -45.40383529663086, -43.01001739501953, -40.6161994934082, -38.222381591796875, -35.82855987548828, -33.43474197387695, -31.04092025756836, -28.6471004486084, -26.25328254699707, -23.85946273803711, -21.46564483642578, -19.07182502746582, -16.67800521850586, -14.284187316894531, -11.89036750793457, -9.496548652648926, -7.102729320526123, -4.70890998840332, -2.315091133117676, 0.07872772216796875, 2.4725475311279297, 4.866365432739258, 7.260185241699219, 9.654004096984863, 12.047822952270508, 14.441642761230469, 16.835460662841797, 19.229280471801758, 21.62310028076172, 24.016918182373047, 26.410737991333008, 28.80455780029297, 31.198375701904297, 33.592193603515625, 35.98601531982422, 38.37983322143555, 40.773651123046875, 43.16747283935547, 45.5612907409668, 47.955108642578125, 50.34893035888672, 52.74274826049805, 55.136566162109375, 57.53038787841797, 59.9242057800293, 62.318023681640625, 64.71184539794922, 67.10566711425781, 69.49948120117188, 71.89330291748047, 74.28712463378906, 76.68093872070312, 79.07476043701172, 81.46858215332031, 83.86239624023438]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 15.0, 9.0, 13.0, 21.0, 25.0, 26.0, 38.0, 42.0, 52.0, 76.0, 104.0, 157.0, 226.0, 334.0, 626.0, 1289.0, 3075.0, 10008.0, 38754.0, 185599.0, 533960.0, 212223.0, 44057.0, 11136.0, 3524.0, 1355.0, 641.0, 386.0, 240.0, 152.0, 93.0, 68.0, 44.0, 45.0, 27.0, 22.0, 25.0, 15.0, 10.0, 11.0, 9.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.109375, -18.55615234375, -18.0029296875, -17.44970703125, -16.896484375, -16.34326171875, -15.7900390625, -15.23681640625, -14.68359375, -14.13037109375, -13.5771484375, -13.02392578125, -12.470703125, -11.91748046875, -11.3642578125, -10.81103515625, -10.2578125, -9.70458984375, -9.1513671875, -8.59814453125, -8.044921875, -7.49169921875, -6.9384765625, -6.38525390625, -5.83203125, -5.27880859375, -4.7255859375, -4.17236328125, -3.619140625, -3.06591796875, -2.5126953125, -1.95947265625, -1.40625, -0.85302734375, -0.2998046875, 0.25341796875, 0.806640625, 1.35986328125, 1.9130859375, 2.46630859375, 3.01953125, 3.57275390625, 4.1259765625, 4.67919921875, 5.232421875, 5.78564453125, 6.3388671875, 6.89208984375, 7.4453125, 7.99853515625, 8.5517578125, 9.10498046875, 9.658203125, 10.21142578125, 10.7646484375, 11.31787109375, 11.87109375, 12.42431640625, 12.9775390625, 13.53076171875, 14.083984375, 14.63720703125, 15.1904296875, 15.74365234375, 16.296875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 13.0, 15.0, 30.0, 55.0, 78.0, 108.0, 124.0, 142.0, 117.0, 118.0, 65.0, 64.0, 28.0, 21.0, 11.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3515625, -3.225341796875, -3.09912109375, -2.972900390625, -2.8466796875, -2.720458984375, -2.59423828125, -2.468017578125, -2.341796875, -2.215576171875, -2.08935546875, -1.963134765625, -1.8369140625, -1.710693359375, -1.58447265625, -1.458251953125, -1.33203125, -1.205810546875, -1.07958984375, -0.953369140625, -0.8271484375, -0.700927734375, -0.57470703125, -0.448486328125, -0.322265625, -0.196044921875, -0.06982421875, 0.056396484375, 0.1826171875, 0.308837890625, 0.43505859375, 0.561279296875, 0.6875, 0.813720703125, 0.93994140625, 1.066162109375, 1.1923828125, 1.318603515625, 1.44482421875, 1.571044921875, 1.697265625, 1.823486328125, 1.94970703125, 2.075927734375, 2.2021484375, 2.328369140625, 2.45458984375, 2.580810546875, 2.70703125, 2.833251953125, 2.95947265625, 3.085693359375, 3.2119140625, 3.338134765625, 3.46435546875, 3.590576171875, 3.716796875, 3.843017578125, 3.96923828125, 4.095458984375, 4.2216796875, 4.347900390625, 4.47412109375, 4.600341796875, 4.7265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 7.0, 11.0, 12.0, 16.0, 25.0, 34.0, 36.0, 60.0, 94.0, 124.0, 178.0, 300.0, 487.0, 749.0, 1320.0, 2439.0, 5144.0, 12016.0, 30023.0, 85273.0, 230522.0, 367812.0, 195768.0, 70409.0, 25519.0, 10243.0, 4539.0, 2239.0, 1218.0, 645.0, 431.0, 291.0, 166.0, 124.0, 85.0, 48.0, 37.0, 28.0, 20.0, 16.0, 18.0, 6.0, 14.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.9296875, -8.6541748046875, -8.378662109375, -8.1031494140625, -7.82763671875, -7.5521240234375, -7.276611328125, -7.0010986328125, -6.7255859375, -6.4500732421875, -6.174560546875, -5.8990478515625, -5.62353515625, -5.3480224609375, -5.072509765625, -4.7969970703125, -4.521484375, -4.2459716796875, -3.970458984375, -3.6949462890625, -3.41943359375, -3.1439208984375, -2.868408203125, -2.5928955078125, -2.3173828125, -2.0418701171875, -1.766357421875, -1.4908447265625, -1.21533203125, -0.9398193359375, -0.664306640625, -0.3887939453125, -0.11328125, 0.1622314453125, 0.437744140625, 0.7132568359375, 0.98876953125, 1.2642822265625, 1.539794921875, 1.8153076171875, 2.0908203125, 2.3663330078125, 2.641845703125, 2.9173583984375, 3.19287109375, 3.4683837890625, 3.743896484375, 4.0194091796875, 4.294921875, 4.5704345703125, 4.845947265625, 5.1214599609375, 5.39697265625, 5.6724853515625, 5.947998046875, 6.2235107421875, 6.4990234375, 6.7745361328125, 7.050048828125, 7.3255615234375, 7.60107421875, 7.8765869140625, 8.152099609375, 8.4276123046875, 8.703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 11.0, 6.0, 10.0, 9.0, 13.0, 10.0, 10.0, 18.0, 24.0, 18.0, 26.0, 22.0, 30.0, 39.0, 27.0, 29.0, 47.0, 40.0, 37.0, 32.0, 49.0, 54.0, 32.0, 37.0, 47.0, 26.0, 29.0, 32.0, 32.0, 21.0, 31.0, 17.0, 19.0, 22.0, 16.0, 11.0, 7.0, 15.0, 14.0, 5.0, 3.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.421875, -5.25201416015625, -5.0821533203125, -4.91229248046875, -4.742431640625, -4.57257080078125, -4.4027099609375, -4.23284912109375, -4.06298828125, -3.89312744140625, -3.7232666015625, -3.55340576171875, -3.383544921875, -3.21368408203125, -3.0438232421875, -2.87396240234375, -2.7041015625, -2.53424072265625, -2.3643798828125, -2.19451904296875, -2.024658203125, -1.85479736328125, -1.6849365234375, -1.51507568359375, -1.34521484375, -1.17535400390625, -1.0054931640625, -0.83563232421875, -0.665771484375, -0.49591064453125, -0.3260498046875, -0.15618896484375, 0.013671875, 0.18353271484375, 0.3533935546875, 0.52325439453125, 0.693115234375, 0.86297607421875, 1.0328369140625, 1.20269775390625, 1.37255859375, 1.54241943359375, 1.7122802734375, 1.88214111328125, 2.052001953125, 2.22186279296875, 2.3917236328125, 2.56158447265625, 2.7314453125, 2.90130615234375, 3.0711669921875, 3.24102783203125, 3.410888671875, 3.58074951171875, 3.7506103515625, 3.92047119140625, 4.09033203125, 4.26019287109375, 4.4300537109375, 4.59991455078125, 4.769775390625, 4.93963623046875, 5.1094970703125, 5.27935791015625, 5.44921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 7.0, 9.0, 19.0, 21.0, 28.0, 69.0, 108.0, 193.0, 302.0, 500.0, 1193.0, 3136.0, 10352.0, 57363.0, 568126.0, 360630.0, 34721.0, 7319.0, 2367.0, 973.0, 463.0, 249.0, 159.0, 84.0, 51.0, 40.0, 17.0, 16.0, 13.0, 8.0, 4.0, 0.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.4061279296875, -8.124755859375, -7.8433837890625, -7.56201171875, -7.2806396484375, -6.999267578125, -6.7178955078125, -6.4365234375, -6.1551513671875, -5.873779296875, -5.5924072265625, -5.31103515625, -5.0296630859375, -4.748291015625, -4.4669189453125, -4.185546875, -3.9041748046875, -3.622802734375, -3.3414306640625, -3.06005859375, -2.7786865234375, -2.497314453125, -2.2159423828125, -1.9345703125, -1.6531982421875, -1.371826171875, -1.0904541015625, -0.80908203125, -0.5277099609375, -0.246337890625, 0.0350341796875, 0.31640625, 0.5977783203125, 0.879150390625, 1.1605224609375, 1.44189453125, 1.7232666015625, 2.004638671875, 2.2860107421875, 2.5673828125, 2.8487548828125, 3.130126953125, 3.4114990234375, 3.69287109375, 3.9742431640625, 4.255615234375, 4.5369873046875, 4.818359375, 5.0997314453125, 5.381103515625, 5.6624755859375, 5.94384765625, 6.2252197265625, 6.506591796875, 6.7879638671875, 7.0693359375, 7.3507080078125, 7.632080078125, 7.9134521484375, 8.19482421875, 8.4761962890625, 8.757568359375, 9.0389404296875, 9.3203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 9.0, 7.0, 11.0, 18.0, 33.0, 42.0, 68.0, 112.0, 135.0, 148.0, 120.0, 104.0, 62.0, 46.0, 32.0, 22.0, 12.0, 6.0, 9.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0019893646240234375, -0.0019474923610687256, -0.0019056200981140137, -0.0018637478351593018, -0.0018218755722045898, -0.001780003309249878, -0.001738131046295166, -0.001696258783340454, -0.0016543865203857422, -0.0016125142574310303, -0.0015706419944763184, -0.0015287697315216064, -0.0014868974685668945, -0.0014450252056121826, -0.0014031529426574707, -0.0013612806797027588, -0.0013194084167480469, -0.001277536153793335, -0.001235663890838623, -0.0011937916278839111, -0.0011519193649291992, -0.0011100471019744873, -0.0010681748390197754, -0.0010263025760650635, -0.0009844303131103516, -0.0009425580501556396, -0.0009006857872009277, -0.0008588135242462158, -0.0008169412612915039, -0.000775068998336792, -0.0007331967353820801, -0.0006913244724273682, -0.0006494522094726562, -0.0006075799465179443, -0.0005657076835632324, -0.0005238354206085205, -0.0004819631576538086, -0.0004400908946990967, -0.00039821863174438477, -0.00035634636878967285, -0.00031447410583496094, -0.000272601842880249, -0.0002307295799255371, -0.0001888573169708252, -0.00014698505401611328, -0.00010511279106140137, -6.324052810668945e-05, -2.136826515197754e-05, 2.0503997802734375e-05, 6.237626075744629e-05, 0.0001042485237121582, 0.00014612078666687012, 0.00018799304962158203, 0.00022986531257629395, 0.00027173757553100586, 0.0003136098384857178, 0.0003554821014404297, 0.0003973543643951416, 0.0004392266273498535, 0.00048109889030456543, 0.0005229711532592773, 0.0005648434162139893, 0.0006067156791687012, 0.0006485879421234131, 0.000690460205078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 12.0, 18.0, 23.0, 21.0, 34.0, 57.0, 98.0, 164.0, 244.0, 413.0, 850.0, 1675.0, 4162.0, 12799.0, 77621.0, 646728.0, 264580.0, 26865.0, 6879.0, 2593.0, 1216.0, 601.0, 333.0, 205.0, 115.0, 68.0, 47.0, 40.0, 14.0, 17.0, 14.0, 10.0, 5.0, 2.0, 6.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.76953125, -7.51678466796875, -7.2640380859375, -7.01129150390625, -6.758544921875, -6.50579833984375, -6.2530517578125, -6.00030517578125, -5.74755859375, -5.49481201171875, -5.2420654296875, -4.98931884765625, -4.736572265625, -4.48382568359375, -4.2310791015625, -3.97833251953125, -3.7255859375, -3.47283935546875, -3.2200927734375, -2.96734619140625, -2.714599609375, -2.46185302734375, -2.2091064453125, -1.95635986328125, -1.70361328125, -1.45086669921875, -1.1981201171875, -0.94537353515625, -0.692626953125, -0.43988037109375, -0.1871337890625, 0.06561279296875, 0.318359375, 0.57110595703125, 0.8238525390625, 1.07659912109375, 1.329345703125, 1.58209228515625, 1.8348388671875, 2.08758544921875, 2.34033203125, 2.59307861328125, 2.8458251953125, 3.09857177734375, 3.351318359375, 3.60406494140625, 3.8568115234375, 4.10955810546875, 4.3623046875, 4.61505126953125, 4.8677978515625, 5.12054443359375, 5.373291015625, 5.62603759765625, 5.8787841796875, 6.13153076171875, 6.38427734375, 6.63702392578125, 6.8897705078125, 7.14251708984375, 7.395263671875, 7.64801025390625, 7.9007568359375, 8.15350341796875, 8.40625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 10.0, 12.0, 17.0, 20.0, 40.0, 48.0, 76.0, 91.0, 109.0, 120.0, 117.0, 118.0, 69.0, 58.0, 19.0, 12.0, 21.0, 14.0, 7.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.950439453125, -6.73681640625, -6.523193359375, -6.3095703125, -6.095947265625, -5.88232421875, -5.668701171875, -5.455078125, -5.241455078125, -5.02783203125, -4.814208984375, -4.6005859375, -4.386962890625, -4.17333984375, -3.959716796875, -3.74609375, -3.532470703125, -3.31884765625, -3.105224609375, -2.8916015625, -2.677978515625, -2.46435546875, -2.250732421875, -2.037109375, -1.823486328125, -1.60986328125, -1.396240234375, -1.1826171875, -0.968994140625, -0.75537109375, -0.541748046875, -0.328125, -0.114501953125, 0.09912109375, 0.312744140625, 0.5263671875, 0.739990234375, 0.95361328125, 1.167236328125, 1.380859375, 1.594482421875, 1.80810546875, 2.021728515625, 2.2353515625, 2.448974609375, 2.66259765625, 2.876220703125, 3.08984375, 3.303466796875, 3.51708984375, 3.730712890625, 3.9443359375, 4.157958984375, 4.37158203125, 4.585205078125, 4.798828125, 5.012451171875, 5.22607421875, 5.439697265625, 5.6533203125, 5.866943359375, 6.08056640625, 6.294189453125, 6.5078125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 21.0, 28.0, 36.0, 70.0, 100.0, 168.0, 197.0, 149.0, 106.0, 59.0, 29.0, 13.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.25228881835938, -81.07689666748047, -77.9015121459961, -74.72611999511719, -71.55073547363281, -68.3753433227539, -65.199951171875, -62.024566650390625, -58.84917449951172, -55.67378616333008, -52.49839782714844, -49.32300567626953, -46.14761734008789, -42.97222900390625, -39.79684066772461, -36.62145233154297, -33.44606399536133, -30.270675659179688, -27.095285415649414, -23.919897079467773, -20.7445068359375, -17.56911849975586, -14.393730163574219, -11.218339920043945, -8.042951583862305, -4.867562294006348, -1.6921734809875488, 1.48321533203125, 4.658604621887207, 7.833993911743164, 11.009382247924805, 14.184772491455078, 17.36016082763672, 20.53554916381836, 23.710939407348633, 26.886327743530273, 30.061717987060547, 33.23710632324219, 36.41249465942383, 39.58788299560547, 42.763275146484375, 45.938663482666016, 49.114051818847656, 52.28944396972656, 55.4648323059082, 58.640220642089844, 61.815608978271484, 64.99099731445312, 68.1663818359375, 71.3417739868164, 74.51715850830078, 77.69255065917969, 80.86793518066406, 84.04332733154297, 87.21871948242188, 90.39410400390625, 93.56949615478516, 96.74488830566406, 99.92027282714844, 103.09566497802734, 106.27104949951172, 109.44644165039062, 112.621826171875, 115.7972183227539, 118.97261047363281]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 8.0, 4.0, 6.0, 3.0, 9.0, 9.0, 17.0, 10.0, 16.0, 14.0, 17.0, 18.0, 24.0, 28.0, 32.0, 34.0, 41.0, 40.0, 42.0, 35.0, 35.0, 45.0, 47.0, 56.0, 42.0, 51.0, 38.0, 40.0, 28.0, 20.0, 24.0, 23.0, 20.0, 22.0, 21.0, 23.0, 18.0, 11.0, 8.0, 12.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.19033432006836, -33.08357238769531, -31.976806640625, -30.87004280090332, -29.76327896118164, -28.65651512145996, -27.54975128173828, -26.4429874420166, -25.336223602294922, -24.229459762573242, -23.122695922851562, -22.015932083129883, -20.909168243408203, -19.802404403686523, -18.695640563964844, -17.588876724243164, -16.482112884521484, -15.375349044799805, -14.268585205078125, -13.161821365356445, -12.055057525634766, -10.948293685913086, -9.841529846191406, -8.734766006469727, -7.628002166748047, -6.521238327026367, -5.4144744873046875, -4.307710647583008, -3.200946807861328, -2.0941829681396484, -0.9874191284179688, 0.11934471130371094, 1.226104736328125, 2.3328685760498047, 3.4396324157714844, 4.546396255493164, 5.653160095214844, 6.759923934936523, 7.866687774658203, 8.973451614379883, 10.080215454101562, 11.186979293823242, 12.293743133544922, 13.400506973266602, 14.507270812988281, 15.614034652709961, 16.72079849243164, 17.82756233215332, 18.934326171875, 20.04109001159668, 21.14785385131836, 22.25461769104004, 23.36138153076172, 24.4681453704834, 25.574909210205078, 26.681673049926758, 27.788436889648438, 28.895200729370117, 30.001964569091797, 31.108728408813477, 32.215492248535156, 33.32225799560547, 34.429019927978516, 35.53578186035156, 36.642547607421875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 10.0, 22.0, 37.0, 68.0, 137.0, 347.0, 931.0, 3195.0, 18720.0, 355908.0, 3757283.0, 48359.0, 6291.0, 1654.0, 644.0, 273.0, 141.0, 87.0, 57.0, 26.0, 30.0, 13.0, 9.0, 7.0, 11.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9765625, -13.2489013671875, -12.521240234375, -11.7935791015625, -11.06591796875, -10.3382568359375, -9.610595703125, -8.8829345703125, -8.1552734375, -7.4276123046875, -6.699951171875, -5.9722900390625, -5.24462890625, -4.5169677734375, -3.789306640625, -3.0616455078125, -2.333984375, -1.6063232421875, -0.878662109375, -0.1510009765625, 0.57666015625, 1.3043212890625, 2.031982421875, 2.7596435546875, 3.4873046875, 4.2149658203125, 4.942626953125, 5.6702880859375, 6.39794921875, 7.1256103515625, 7.853271484375, 8.5809326171875, 9.30859375, 10.0362548828125, 10.763916015625, 11.4915771484375, 12.21923828125, 12.9468994140625, 13.674560546875, 14.4022216796875, 15.1298828125, 15.8575439453125, 16.585205078125, 17.3128662109375, 18.04052734375, 18.7681884765625, 19.495849609375, 20.2235107421875, 20.951171875, 21.6788330078125, 22.406494140625, 23.1341552734375, 23.86181640625, 24.5894775390625, 25.317138671875, 26.0447998046875, 26.7724609375, 27.5001220703125, 28.227783203125, 28.9554443359375, 29.68310546875, 30.4107666015625, 31.138427734375, 31.8660888671875, 32.59375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 6.0, 11.0, 13.0, 23.0, 47.0, 83.0, 70.0, 117.0, 127.0, 114.0, 105.0, 76.0, 79.0, 45.0, 42.0, 12.0, 11.0, 9.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9921875, -2.87310791015625, -2.7540283203125, -2.63494873046875, -2.515869140625, -2.39678955078125, -2.2777099609375, -2.15863037109375, -2.03955078125, -1.92047119140625, -1.8013916015625, -1.68231201171875, -1.563232421875, -1.44415283203125, -1.3250732421875, -1.20599365234375, -1.0869140625, -0.96783447265625, -0.8487548828125, -0.72967529296875, -0.610595703125, -0.49151611328125, -0.3724365234375, -0.25335693359375, -0.13427734375, -0.01519775390625, 0.1038818359375, 0.22296142578125, 0.342041015625, 0.46112060546875, 0.5802001953125, 0.69927978515625, 0.818359375, 0.93743896484375, 1.0565185546875, 1.17559814453125, 1.294677734375, 1.41375732421875, 1.5328369140625, 1.65191650390625, 1.77099609375, 1.89007568359375, 2.0091552734375, 2.12823486328125, 2.247314453125, 2.36639404296875, 2.4854736328125, 2.60455322265625, 2.7236328125, 2.84271240234375, 2.9617919921875, 3.08087158203125, 3.199951171875, 3.31903076171875, 3.4381103515625, 3.55718994140625, 3.67626953125, 3.79534912109375, 3.9144287109375, 4.03350830078125, 4.152587890625, 4.27166748046875, 4.3907470703125, 4.50982666015625, 4.62890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 6.0, 14.0, 14.0, 12.0, 20.0, 15.0, 24.0, 41.0, 38.0, 38.0, 44.0, 60.0, 100.0, 301.0, 1708.0, 64095.0, 4114409.0, 12101.0, 770.0, 142.0, 80.0, 42.0, 46.0, 30.0, 28.0, 23.0, 19.0, 15.0, 13.0, 7.0, 6.0, 7.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.9375, -47.32421875, -45.7109375, -44.09765625, -42.484375, -40.87109375, -39.2578125, -37.64453125, -36.03125, -34.41796875, -32.8046875, -31.19140625, -29.578125, -27.96484375, -26.3515625, -24.73828125, -23.125, -21.51171875, -19.8984375, -18.28515625, -16.671875, -15.05859375, -13.4453125, -11.83203125, -10.21875, -8.60546875, -6.9921875, -5.37890625, -3.765625, -2.15234375, -0.5390625, 1.07421875, 2.6875, 4.30078125, 5.9140625, 7.52734375, 9.140625, 10.75390625, 12.3671875, 13.98046875, 15.59375, 17.20703125, 18.8203125, 20.43359375, 22.046875, 23.66015625, 25.2734375, 26.88671875, 28.5, 30.11328125, 31.7265625, 33.33984375, 34.953125, 36.56640625, 38.1796875, 39.79296875, 41.40625, 43.01953125, 44.6328125, 46.24609375, 47.859375, 49.47265625, 51.0859375, 52.69921875, 54.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 16.0, 46.0, 170.0, 1560.0, 2078.0, 169.0, 27.0, 12.0, 2.0, 1.0, 0.0, 2.0], "bins": [-29.5, -28.97344970703125, -28.4468994140625, -27.92034912109375, -27.393798828125, -26.86724853515625, -26.3406982421875, -25.81414794921875, -25.28759765625, -24.76104736328125, -24.2344970703125, -23.70794677734375, -23.181396484375, -22.65484619140625, -22.1282958984375, -21.60174560546875, -21.0751953125, -20.54864501953125, -20.0220947265625, -19.49554443359375, -18.968994140625, -18.44244384765625, -17.9158935546875, -17.38934326171875, -16.86279296875, -16.33624267578125, -15.8096923828125, -15.28314208984375, -14.756591796875, -14.23004150390625, -13.7034912109375, -13.17694091796875, -12.650390625, -12.12384033203125, -11.5972900390625, -11.07073974609375, -10.544189453125, -10.01763916015625, -9.4910888671875, -8.96453857421875, -8.43798828125, -7.91143798828125, -7.3848876953125, -6.85833740234375, -6.331787109375, -5.80523681640625, -5.2786865234375, -4.75213623046875, -4.2255859375, -3.69903564453125, -3.1724853515625, -2.64593505859375, -2.119384765625, -1.59283447265625, -1.0662841796875, -0.53973388671875, -0.01318359375, 0.51336669921875, 1.0399169921875, 1.56646728515625, 2.093017578125, 2.61956787109375, 3.1461181640625, 3.67266845703125, 4.19921875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 16.0, 93.0, 426.0, 391.0, 57.0, 11.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.81497192382812, -146.84622192382812, -142.87745666503906, -138.90870666503906, -134.93994140625, -130.97119140625, -127.00243377685547, -123.03367614746094, -119.0649185180664, -115.09616088867188, -111.12740325927734, -107.15864562988281, -103.18989562988281, -99.22113037109375, -95.25238037109375, -91.28362274169922, -87.31486511230469, -83.34610748291016, -79.37734985351562, -75.4085922241211, -71.43983459472656, -67.47108459472656, -63.50232696533203, -59.5335693359375, -55.56481170654297, -51.59605407714844, -47.627296447753906, -43.65854263305664, -39.68978500366211, -35.72102737426758, -31.75227165222168, -27.78351593017578, -23.81476593017578, -19.84600830078125, -15.877252578735352, -11.908495903015137, -7.939739227294922, -3.9709815979003906, -0.0022258758544921875, 3.9665298461914062, 7.9352874755859375, 11.904044151306152, 15.872800827026367, 19.841556549072266, 23.810314178466797, 27.779071807861328, 31.747827529907227, 35.716583251953125, 39.685340881347656, 43.65409851074219, 47.62285614013672, 51.591609954833984, 55.560367584228516, 59.52912521362305, 63.49787902832031, 67.46663665771484, 71.43539428710938, 75.4041519165039, 79.37290954589844, 83.34166717529297, 87.3104248046875, 91.2791748046875, 95.24793243408203, 99.21669006347656, 103.1854476928711]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 10.0, 26.0, 52.0, 93.0, 151.0, 170.0, 185.0, 140.0, 90.0, 57.0, 24.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.6444091796875, -63.58757781982422, -61.53074645996094, -59.473915100097656, -57.417083740234375, -55.360252380371094, -53.30342102050781, -51.24658966064453, -49.18975830078125, -47.13292694091797, -45.07609558105469, -43.019264221191406, -40.962432861328125, -38.905601501464844, -36.84877014160156, -34.79193878173828, -32.735107421875, -30.67827606201172, -28.621444702148438, -26.564613342285156, -24.507781982421875, -22.450950622558594, -20.394119262695312, -18.33728790283203, -16.28045654296875, -14.223625183105469, -12.166793823242188, -10.109962463378906, -8.053131103515625, -5.996299743652344, -3.9394683837890625, -1.8826370239257812, 0.17420196533203125, 2.2310333251953125, 4.287864685058594, 6.344696044921875, 8.401527404785156, 10.458358764648438, 12.515190124511719, 14.572021484375, 16.62885284423828, 18.685684204101562, 20.742515563964844, 22.799346923828125, 24.856178283691406, 26.913009643554688, 28.96984100341797, 31.02667236328125, 33.08350372314453, 35.14033508300781, 37.197166442871094, 39.253997802734375, 41.310829162597656, 43.36766052246094, 45.42449188232422, 47.4813232421875, 49.53815460205078, 51.59498596191406, 53.651817321777344, 55.708648681640625, 57.765480041503906, 59.82231140136719, 61.87914276123047, 63.93597412109375, 65.99280548095703]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 5.0, 8.0, 15.0, 19.0, 19.0, 44.0, 70.0, 131.0, 169.0, 291.0, 574.0, 1133.0, 2516.0, 6802.0, 24285.0, 108197.0, 434697.0, 358782.0, 82185.0, 18589.0, 5654.0, 2177.0, 947.0, 517.0, 294.0, 159.0, 105.0, 59.0, 37.0, 28.0, 22.0, 7.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-20.703125, -20.1422119140625, -19.581298828125, -19.0203857421875, -18.45947265625, -17.8985595703125, -17.337646484375, -16.7767333984375, -16.2158203125, -15.6549072265625, -15.093994140625, -14.5330810546875, -13.97216796875, -13.4112548828125, -12.850341796875, -12.2894287109375, -11.728515625, -11.1676025390625, -10.606689453125, -10.0457763671875, -9.48486328125, -8.9239501953125, -8.363037109375, -7.8021240234375, -7.2412109375, -6.6802978515625, -6.119384765625, -5.5584716796875, -4.99755859375, -4.4366455078125, -3.875732421875, -3.3148193359375, -2.75390625, -2.1929931640625, -1.632080078125, -1.0711669921875, -0.51025390625, 0.0506591796875, 0.611572265625, 1.1724853515625, 1.7333984375, 2.2943115234375, 2.855224609375, 3.4161376953125, 3.97705078125, 4.5379638671875, 5.098876953125, 5.6597900390625, 6.220703125, 6.7816162109375, 7.342529296875, 7.9034423828125, 8.46435546875, 9.0252685546875, 9.586181640625, 10.1470947265625, 10.7080078125, 11.2689208984375, 11.829833984375, 12.3907470703125, 12.95166015625, 13.5125732421875, 14.073486328125, 14.6343994140625, 15.1953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 2.0, 9.0, 16.0, 22.0, 58.0, 56.0, 71.0, 105.0, 104.0, 115.0, 108.0, 92.0, 77.0, 59.0, 38.0, 22.0, 17.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9375, -2.830322265625, -2.72314453125, -2.615966796875, -2.5087890625, -2.401611328125, -2.29443359375, -2.187255859375, -2.080078125, -1.972900390625, -1.86572265625, -1.758544921875, -1.6513671875, -1.544189453125, -1.43701171875, -1.329833984375, -1.22265625, -1.115478515625, -1.00830078125, -0.901123046875, -0.7939453125, -0.686767578125, -0.57958984375, -0.472412109375, -0.365234375, -0.258056640625, -0.15087890625, -0.043701171875, 0.0634765625, 0.170654296875, 0.27783203125, 0.385009765625, 0.4921875, 0.599365234375, 0.70654296875, 0.813720703125, 0.9208984375, 1.028076171875, 1.13525390625, 1.242431640625, 1.349609375, 1.456787109375, 1.56396484375, 1.671142578125, 1.7783203125, 1.885498046875, 1.99267578125, 2.099853515625, 2.20703125, 2.314208984375, 2.42138671875, 2.528564453125, 2.6357421875, 2.742919921875, 2.85009765625, 2.957275390625, 3.064453125, 3.171630859375, 3.27880859375, 3.385986328125, 3.4931640625, 3.600341796875, 3.70751953125, 3.814697265625, 3.921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 3.0, 7.0, 13.0, 13.0, 11.0, 23.0, 27.0, 25.0, 56.0, 74.0, 95.0, 115.0, 159.0, 244.0, 319.0, 455.0, 654.0, 1115.0, 1816.0, 3374.0, 6712.0, 14216.0, 31883.0, 75539.0, 175481.0, 308796.0, 235358.0, 107724.0, 45114.0, 19460.0, 8927.0, 4426.0, 2334.0, 1347.0, 819.0, 547.0, 379.0, 228.0, 183.0, 123.0, 85.0, 73.0, 59.0, 34.0, 29.0, 22.0, 10.0, 20.0, 10.0, 6.0, 6.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.375, -8.118896484375, -7.86279296875, -7.606689453125, -7.3505859375, -7.094482421875, -6.83837890625, -6.582275390625, -6.326171875, -6.070068359375, -5.81396484375, -5.557861328125, -5.3017578125, -5.045654296875, -4.78955078125, -4.533447265625, -4.27734375, -4.021240234375, -3.76513671875, -3.509033203125, -3.2529296875, -2.996826171875, -2.74072265625, -2.484619140625, -2.228515625, -1.972412109375, -1.71630859375, -1.460205078125, -1.2041015625, -0.947998046875, -0.69189453125, -0.435791015625, -0.1796875, 0.076416015625, 0.33251953125, 0.588623046875, 0.8447265625, 1.100830078125, 1.35693359375, 1.613037109375, 1.869140625, 2.125244140625, 2.38134765625, 2.637451171875, 2.8935546875, 3.149658203125, 3.40576171875, 3.661865234375, 3.91796875, 4.174072265625, 4.43017578125, 4.686279296875, 4.9423828125, 5.198486328125, 5.45458984375, 5.710693359375, 5.966796875, 6.222900390625, 6.47900390625, 6.735107421875, 6.9912109375, 7.247314453125, 7.50341796875, 7.759521484375, 8.015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 0.0, 3.0, 3.0, 7.0, 7.0, 13.0, 12.0, 16.0, 20.0, 26.0, 28.0, 34.0, 39.0, 28.0, 38.0, 45.0, 46.0, 51.0, 54.0, 51.0, 46.0, 38.0, 43.0, 46.0, 57.0, 45.0, 30.0, 28.0, 22.0, 26.0, 21.0, 19.0, 11.0, 13.0, 13.0, 8.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.59765625, -7.376953125, -7.15625, -6.935546875, -6.71484375, -6.494140625, -6.2734375, -6.052734375, -5.83203125, -5.611328125, -5.390625, -5.169921875, -4.94921875, -4.728515625, -4.5078125, -4.287109375, -4.06640625, -3.845703125, -3.625, -3.404296875, -3.18359375, -2.962890625, -2.7421875, -2.521484375, -2.30078125, -2.080078125, -1.859375, -1.638671875, -1.41796875, -1.197265625, -0.9765625, -0.755859375, -0.53515625, -0.314453125, -0.09375, 0.126953125, 0.34765625, 0.568359375, 0.7890625, 1.009765625, 1.23046875, 1.451171875, 1.671875, 1.892578125, 2.11328125, 2.333984375, 2.5546875, 2.775390625, 2.99609375, 3.216796875, 3.4375, 3.658203125, 3.87890625, 4.099609375, 4.3203125, 4.541015625, 4.76171875, 4.982421875, 5.203125, 5.423828125, 5.64453125, 5.865234375, 6.0859375, 6.306640625, 6.52734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 4.0, 7.0, 3.0, 6.0, 9.0, 14.0, 23.0, 21.0, 36.0, 42.0, 60.0, 84.0, 129.0, 177.0, 303.0, 478.0, 961.0, 2046.0, 4987.0, 14676.0, 58346.0, 395320.0, 473092.0, 70547.0, 16779.0, 5533.0, 2357.0, 1054.0, 556.0, 288.0, 160.0, 127.0, 89.0, 59.0, 41.0, 39.0, 32.0, 28.0, 10.0, 10.0, 7.0, 4.0, 6.0, 4.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-9.21875, -8.96307373046875, -8.7073974609375, -8.45172119140625, -8.196044921875, -7.94036865234375, -7.6846923828125, -7.42901611328125, -7.17333984375, -6.91766357421875, -6.6619873046875, -6.40631103515625, -6.150634765625, -5.89495849609375, -5.6392822265625, -5.38360595703125, -5.1279296875, -4.87225341796875, -4.6165771484375, -4.36090087890625, -4.105224609375, -3.84954833984375, -3.5938720703125, -3.33819580078125, -3.08251953125, -2.82684326171875, -2.5711669921875, -2.31549072265625, -2.059814453125, -1.80413818359375, -1.5484619140625, -1.29278564453125, -1.037109375, -0.78143310546875, -0.5257568359375, -0.27008056640625, -0.014404296875, 0.24127197265625, 0.4969482421875, 0.75262451171875, 1.00830078125, 1.26397705078125, 1.5196533203125, 1.77532958984375, 2.031005859375, 2.28668212890625, 2.5423583984375, 2.79803466796875, 3.0537109375, 3.30938720703125, 3.5650634765625, 3.82073974609375, 4.076416015625, 4.33209228515625, 4.5877685546875, 4.84344482421875, 5.09912109375, 5.35479736328125, 5.6104736328125, 5.86614990234375, 6.121826171875, 6.37750244140625, 6.6331787109375, 6.88885498046875, 7.14453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 9.0, 11.0, 17.0, 14.0, 25.0, 21.0, 32.0, 56.0, 67.0, 88.0, 91.0, 107.0, 88.0, 87.0, 76.0, 36.0, 39.0, 32.0, 22.0, 15.0, 13.0, 7.0, 7.0, 6.0, 2.0, 5.0, 2.0, 8.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.000972747802734375, -0.0009440034627914429, -0.0009152591228485107, -0.0008865147829055786, -0.0008577704429626465, -0.0008290261030197144, -0.0008002817630767822, -0.0007715374231338501, -0.000742793083190918, -0.0007140487432479858, -0.0006853044033050537, -0.0006565600633621216, -0.0006278157234191895, -0.0005990713834762573, -0.0005703270435333252, -0.0005415827035903931, -0.0005128383636474609, -0.0004840940237045288, -0.0004553496837615967, -0.00042660534381866455, -0.0003978610038757324, -0.0003691166639328003, -0.00034037232398986816, -0.00031162798404693604, -0.0002828836441040039, -0.0002541393041610718, -0.00022539496421813965, -0.00019665062427520752, -0.0001679062843322754, -0.00013916194438934326, -0.00011041760444641113, -8.1673264503479e-05, -5.2928924560546875e-05, -2.4184584617614746e-05, 4.559755325317383e-06, 3.330409526824951e-05, 6.204843521118164e-05, 9.079277515411377e-05, 0.0001195371150970459, 0.00014828145503997803, 0.00017702579498291016, 0.00020577013492584229, 0.00023451447486877441, 0.00026325881481170654, 0.00029200315475463867, 0.0003207474946975708, 0.00034949183464050293, 0.00037823617458343506, 0.0004069805145263672, 0.0004357248544692993, 0.00046446919441223145, 0.0004932135343551636, 0.0005219578742980957, 0.0005507022142410278, 0.00057944655418396, 0.0006081908941268921, 0.0006369352340698242, 0.0006656795740127563, 0.0006944239139556885, 0.0007231682538986206, 0.0007519125938415527, 0.0007806569337844849, 0.000809401273727417, 0.0008381456136703491, 0.0008668899536132812]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 14.0, 10.0, 29.0, 42.0, 75.0, 95.0, 187.0, 298.0, 623.0, 1953.0, 8306.0, 76427.0, 852507.0, 94814.0, 9614.0, 2089.0, 693.0, 338.0, 187.0, 89.0, 63.0, 42.0, 20.0, 15.0, 12.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.2392578125, -12.791015625, -12.3427734375, -11.89453125, -11.4462890625, -10.998046875, -10.5498046875, -10.1015625, -9.6533203125, -9.205078125, -8.7568359375, -8.30859375, -7.8603515625, -7.412109375, -6.9638671875, -6.515625, -6.0673828125, -5.619140625, -5.1708984375, -4.72265625, -4.2744140625, -3.826171875, -3.3779296875, -2.9296875, -2.4814453125, -2.033203125, -1.5849609375, -1.13671875, -0.6884765625, -0.240234375, 0.2080078125, 0.65625, 1.1044921875, 1.552734375, 2.0009765625, 2.44921875, 2.8974609375, 3.345703125, 3.7939453125, 4.2421875, 4.6904296875, 5.138671875, 5.5869140625, 6.03515625, 6.4833984375, 6.931640625, 7.3798828125, 7.828125, 8.2763671875, 8.724609375, 9.1728515625, 9.62109375, 10.0693359375, 10.517578125, 10.9658203125, 11.4140625, 11.8623046875, 12.310546875, 12.7587890625, 13.20703125, 13.6552734375, 14.103515625, 14.5517578125, 15.0]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 8.0, 11.0, 18.0, 17.0, 24.0, 27.0, 38.0, 35.0, 62.0, 77.0, 89.0, 92.0, 109.0, 97.0, 65.0, 58.0, 33.0, 31.0, 24.0, 14.0, 13.0, 4.0, 8.0, 8.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1796875, -5.97833251953125, -5.7769775390625, -5.57562255859375, -5.374267578125, -5.17291259765625, -4.9715576171875, -4.77020263671875, -4.56884765625, -4.36749267578125, -4.1661376953125, -3.96478271484375, -3.763427734375, -3.56207275390625, -3.3607177734375, -3.15936279296875, -2.9580078125, -2.75665283203125, -2.5552978515625, -2.35394287109375, -2.152587890625, -1.95123291015625, -1.7498779296875, -1.54852294921875, -1.34716796875, -1.14581298828125, -0.9444580078125, -0.74310302734375, -0.541748046875, -0.34039306640625, -0.1390380859375, 0.06231689453125, 0.263671875, 0.46502685546875, 0.6663818359375, 0.86773681640625, 1.069091796875, 1.27044677734375, 1.4718017578125, 1.67315673828125, 1.87451171875, 2.07586669921875, 2.2772216796875, 2.47857666015625, 2.679931640625, 2.88128662109375, 3.0826416015625, 3.28399658203125, 3.4853515625, 3.68670654296875, 3.8880615234375, 4.08941650390625, 4.290771484375, 4.49212646484375, 4.6934814453125, 4.89483642578125, 5.09619140625, 5.29754638671875, 5.4989013671875, 5.70025634765625, 5.901611328125, 6.10296630859375, 6.3043212890625, 6.50567626953125, 6.70703125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 8.0, 4.0, 24.0, 73.0, 170.0, 283.0, 233.0, 120.0, 58.0, 13.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.73983764648438, -210.53208923339844, -204.3243408203125, -198.11660766601562, -191.9088592529297, -185.70111083984375, -179.4933624267578, -173.28561401367188, -167.077880859375, -160.87013244628906, -154.66238403320312, -148.45465087890625, -142.2469024658203, -136.03915405273438, -129.83140563964844, -123.6236572265625, -117.41590881347656, -111.20816040039062, -105.00041961669922, -98.79267120361328, -92.58493041992188, -86.37718200683594, -80.16943359375, -73.96168518066406, -67.75394439697266, -61.546199798583984, -55.33845520019531, -49.130706787109375, -42.9229621887207, -36.71521759033203, -30.507469177246094, -24.299724578857422, -18.09197998046875, -11.884234428405762, -5.676488876342773, 0.5312576293945312, 6.739002227783203, 12.946746826171875, 19.154495239257812, 25.362239837646484, 31.569984436035156, 37.77772903442383, 43.9854736328125, 50.19322204589844, 56.40096664428711, 62.60871124267578, 68.81645965576172, 75.02420043945312, 81.23194885253906, 87.439697265625, 93.6474380493164, 99.85518646240234, 106.06292724609375, 112.27067565917969, 118.47842407226562, 124.68617248535156, 130.8939208984375, 137.10166931152344, 143.30941772460938, 149.51715087890625, 155.7248992919922, 161.93264770507812, 168.14039611816406, 174.34814453125, 180.55587768554688]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 7.0, 11.0, 14.0, 9.0, 15.0, 31.0, 21.0, 18.0, 27.0, 30.0, 36.0, 32.0, 28.0, 32.0, 38.0, 51.0, 44.0, 66.0, 42.0, 39.0, 44.0, 37.0, 42.0, 42.0, 31.0, 36.0, 34.0, 26.0, 14.0, 16.0, 17.0, 14.0, 9.0, 10.0, 4.0, 3.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-37.16448974609375, -35.95215606689453, -34.73982620239258, -33.52749252319336, -32.315162658691406, -31.10283088684082, -29.890499114990234, -28.678165435791016, -27.465835571289062, -26.253503799438477, -25.04117202758789, -23.828840255737305, -22.61650848388672, -21.404176712036133, -20.191844940185547, -18.979511260986328, -17.767179489135742, -16.554847717285156, -15.34251594543457, -14.130184173583984, -12.917852401733398, -11.705520629882812, -10.49318790435791, -9.280856132507324, -8.068524360656738, -6.856192588806152, -5.643860816955566, -4.431528568267822, -3.2191967964172363, -2.0068650245666504, -0.7945327758789062, 0.4177989959716797, 1.6301307678222656, 2.8424625396728516, 4.0547943115234375, 5.267126560211182, 6.479458332061768, 7.6917901039123535, 8.904122352600098, 10.116454124450684, 11.32878589630127, 12.541117668151855, 13.753449440002441, 14.965782165527344, 16.17811393737793, 17.390445709228516, 18.6027774810791, 19.815109252929688, 21.027441024780273, 22.23977279663086, 23.452104568481445, 24.66443634033203, 25.876768112182617, 27.089099884033203, 28.301433563232422, 29.513763427734375, 30.726097106933594, 31.93842887878418, 33.150760650634766, 34.363094329833984, 35.57542419433594, 36.787757873535156, 38.00008773803711, 39.21242141723633, 40.42475128173828]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 14.0, 17.0, 26.0, 50.0, 89.0, 195.0, 443.0, 1042.0, 2916.0, 9444.0, 46840.0, 723591.0, 3313888.0, 75466.0, 13626.0, 3943.0, 1359.0, 609.0, 301.0, 152.0, 93.0, 62.0, 36.0, 23.0, 19.0, 14.0, 10.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.0625, -18.4296875, -17.796875, -17.1640625, -16.53125, -15.8984375, -15.265625, -14.6328125, -14.0, -13.3671875, -12.734375, -12.1015625, -11.46875, -10.8359375, -10.203125, -9.5703125, -8.9375, -8.3046875, -7.671875, -7.0390625, -6.40625, -5.7734375, -5.140625, -4.5078125, -3.875, -3.2421875, -2.609375, -1.9765625, -1.34375, -0.7109375, -0.078125, 0.5546875, 1.1875, 1.8203125, 2.453125, 3.0859375, 3.71875, 4.3515625, 4.984375, 5.6171875, 6.25, 6.8828125, 7.515625, 8.1484375, 8.78125, 9.4140625, 10.046875, 10.6796875, 11.3125, 11.9453125, 12.578125, 13.2109375, 13.84375, 14.4765625, 15.109375, 15.7421875, 16.375, 17.0078125, 17.640625, 18.2734375, 18.90625, 19.5390625, 20.171875, 20.8046875, 21.4375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 7.0, 4.0, 9.0, 20.0, 31.0, 36.0, 57.0, 73.0, 83.0, 86.0, 99.0, 101.0, 81.0, 89.0, 59.0, 42.0, 44.0, 29.0, 12.0, 6.0, 7.0, 3.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4296875, -2.33203125, -2.234375, -2.13671875, -2.0390625, -1.94140625, -1.84375, -1.74609375, -1.6484375, -1.55078125, -1.453125, -1.35546875, -1.2578125, -1.16015625, -1.0625, -0.96484375, -0.8671875, -0.76953125, -0.671875, -0.57421875, -0.4765625, -0.37890625, -0.28125, -0.18359375, -0.0859375, 0.01171875, 0.109375, 0.20703125, 0.3046875, 0.40234375, 0.5, 0.59765625, 0.6953125, 0.79296875, 0.890625, 0.98828125, 1.0859375, 1.18359375, 1.28125, 1.37890625, 1.4765625, 1.57421875, 1.671875, 1.76953125, 1.8671875, 1.96484375, 2.0625, 2.16015625, 2.2578125, 2.35546875, 2.453125, 2.55078125, 2.6484375, 2.74609375, 2.84375, 2.94140625, 3.0390625, 3.13671875, 3.234375, 3.33203125, 3.4296875, 3.52734375, 3.625, 3.72265625, 3.8203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 13.0, 9.0, 31.0, 64.0, 83.0, 164.0, 375.0, 805.0, 2202.0, 7994.0, 49832.0, 2298749.0, 1776215.0, 46833.0, 7409.0, 2025.0, 767.0, 329.0, 181.0, 89.0, 45.0, 25.0, 14.0, 10.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.710693359375, -19.03076171875, -18.350830078125, -17.6708984375, -16.990966796875, -16.31103515625, -15.631103515625, -14.951171875, -14.271240234375, -13.59130859375, -12.911376953125, -12.2314453125, -11.551513671875, -10.87158203125, -10.191650390625, -9.51171875, -8.831787109375, -8.15185546875, -7.471923828125, -6.7919921875, -6.112060546875, -5.43212890625, -4.752197265625, -4.072265625, -3.392333984375, -2.71240234375, -2.032470703125, -1.3525390625, -0.672607421875, 0.00732421875, 0.687255859375, 1.3671875, 2.047119140625, 2.72705078125, 3.406982421875, 4.0869140625, 4.766845703125, 5.44677734375, 6.126708984375, 6.806640625, 7.486572265625, 8.16650390625, 8.846435546875, 9.5263671875, 10.206298828125, 10.88623046875, 11.566162109375, 12.24609375, 12.926025390625, 13.60595703125, 14.285888671875, 14.9658203125, 15.645751953125, 16.32568359375, 17.005615234375, 17.685546875, 18.365478515625, 19.04541015625, 19.725341796875, 20.4052734375, 21.085205078125, 21.76513671875, 22.445068359375, 23.125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 11.0, 13.0, 18.0, 27.0, 54.0, 57.0, 142.0, 230.0, 448.0, 1516.0, 791.0, 328.0, 174.0, 96.0, 62.0, 24.0, 20.0, 19.0, 9.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.09375, -7.87939453125, -7.6650390625, -7.45068359375, -7.236328125, -7.02197265625, -6.8076171875, -6.59326171875, -6.37890625, -6.16455078125, -5.9501953125, -5.73583984375, -5.521484375, -5.30712890625, -5.0927734375, -4.87841796875, -4.6640625, -4.44970703125, -4.2353515625, -4.02099609375, -3.806640625, -3.59228515625, -3.3779296875, -3.16357421875, -2.94921875, -2.73486328125, -2.5205078125, -2.30615234375, -2.091796875, -1.87744140625, -1.6630859375, -1.44873046875, -1.234375, -1.02001953125, -0.8056640625, -0.59130859375, -0.376953125, -0.16259765625, 0.0517578125, 0.26611328125, 0.48046875, 0.69482421875, 0.9091796875, 1.12353515625, 1.337890625, 1.55224609375, 1.7666015625, 1.98095703125, 2.1953125, 2.40966796875, 2.6240234375, 2.83837890625, 3.052734375, 3.26708984375, 3.4814453125, 3.69580078125, 3.91015625, 4.12451171875, 4.3388671875, 4.55322265625, 4.767578125, 4.98193359375, 5.1962890625, 5.41064453125, 5.625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 4.0, 15.0, 19.0, 41.0, 100.0, 150.0, 217.0, 218.0, 135.0, 64.0, 26.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-92.45757293701172, -90.45150756835938, -88.44544219970703, -86.43937683105469, -84.43331146240234, -82.42724609375, -80.42118072509766, -78.41511535644531, -76.40904998779297, -74.40298461914062, -72.39691925048828, -70.39085388183594, -68.3847885131836, -66.37872314453125, -64.3726577758789, -62.36659240722656, -60.36052703857422, -58.354461669921875, -56.34839630126953, -54.34233093261719, -52.336265563964844, -50.3302001953125, -48.324134826660156, -46.31806945800781, -44.31200408935547, -42.305938720703125, -40.29987335205078, -38.29380798339844, -36.287742614746094, -34.28167724609375, -32.275611877441406, -30.269546508789062, -28.26348114013672, -26.257415771484375, -24.25135040283203, -22.245285034179688, -20.239219665527344, -18.233154296875, -16.227088928222656, -14.221023559570312, -12.214958190917969, -10.208892822265625, -8.202827453613281, -6.1967620849609375, -4.190696716308594, -2.18463134765625, -0.17856597900390625, 1.8274993896484375, 3.8335647583007812, 5.839630126953125, 7.845695495605469, 9.851760864257812, 11.857826232910156, 13.8638916015625, 15.869956970214844, 17.876022338867188, 19.88208770751953, 21.888153076171875, 23.89421844482422, 25.900283813476562, 27.906349182128906, 29.91241455078125, 31.918479919433594, 33.92454528808594, 35.93061065673828]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 4.0, 9.0, 11.0, 16.0, 18.0, 20.0, 24.0, 35.0, 21.0, 25.0, 38.0, 33.0, 41.0, 36.0, 30.0, 51.0, 38.0, 50.0, 54.0, 52.0, 56.0, 47.0, 48.0, 37.0, 34.0, 34.0, 25.0, 16.0, 19.0, 12.0, 9.0, 8.0, 9.0, 12.0, 10.0, 7.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.917516708374023, -19.29121971130371, -18.6649227142334, -18.038623809814453, -17.41232681274414, -16.786029815673828, -16.159732818603516, -15.533435821533203, -14.907137870788574, -14.280840873718262, -13.654542922973633, -13.02824592590332, -12.401948928833008, -11.775650978088379, -11.149353981018066, -10.523056030273438, -9.896759033203125, -9.270462036132812, -8.644164085388184, -8.017867088317871, -7.3915696144104, -6.76527214050293, -6.138975143432617, -5.5126776695251465, -4.886380195617676, -4.260082721710205, -3.6337854862213135, -3.007488250732422, -2.381190776824951, -1.7548933029174805, -1.1285960674285889, -0.5022988319396973, 0.12399673461914062, 0.7502940893173218, 1.376591444015503, 2.0028886795043945, 2.6291861534118652, 3.255483627319336, 3.8817808628082275, 4.508078098297119, 5.13437557220459, 5.7606730461120605, 6.386970520019531, 7.013267517089844, 7.6395649909973145, 8.265862464904785, 8.892159461975098, 9.518457412719727, 10.144754409790039, 10.771051406860352, 11.39734935760498, 12.023646354675293, 12.649944305419922, 13.276241302490234, 13.902538299560547, 14.52883529663086, 15.155133247375488, 15.7814302444458, 16.40772819519043, 17.034025192260742, 17.660322189331055, 18.28662109375, 18.912918090820312, 19.539215087890625, 20.165512084960938]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 7.0, 7.0, 13.0, 11.0, 32.0, 22.0, 49.0, 73.0, 108.0, 237.0, 386.0, 647.0, 1154.0, 2246.0, 4674.0, 10546.0, 26891.0, 77104.0, 240742.0, 431958.0, 162902.0, 53442.0, 19490.0, 7950.0, 3725.0, 1780.0, 974.0, 547.0, 339.0, 205.0, 114.0, 67.0, 33.0, 34.0, 20.0, 12.0, 10.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.5625, -16.09375, -15.625, -15.15625, -14.6875, -14.21875, -13.75, -13.28125, -12.8125, -12.34375, -11.875, -11.40625, -10.9375, -10.46875, -10.0, -9.53125, -9.0625, -8.59375, -8.125, -7.65625, -7.1875, -6.71875, -6.25, -5.78125, -5.3125, -4.84375, -4.375, -3.90625, -3.4375, -2.96875, -2.5, -2.03125, -1.5625, -1.09375, -0.625, -0.15625, 0.3125, 0.78125, 1.25, 1.71875, 2.1875, 2.65625, 3.125, 3.59375, 4.0625, 4.53125, 5.0, 5.46875, 5.9375, 6.40625, 6.875, 7.34375, 7.8125, 8.28125, 8.75, 9.21875, 9.6875, 10.15625, 10.625, 11.09375, 11.5625, 12.03125, 12.5, 12.96875, 13.4375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 11.0, 16.0, 22.0, 44.0, 41.0, 58.0, 72.0, 82.0, 84.0, 107.0, 76.0, 88.0, 65.0, 60.0, 48.0, 32.0, 26.0, 20.0, 10.0, 6.0, 4.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.4267578125, -2.328125, -2.2294921875, -2.130859375, -2.0322265625, -1.93359375, -1.8349609375, -1.736328125, -1.6376953125, -1.5390625, -1.4404296875, -1.341796875, -1.2431640625, -1.14453125, -1.0458984375, -0.947265625, -0.8486328125, -0.75, -0.6513671875, -0.552734375, -0.4541015625, -0.35546875, -0.2568359375, -0.158203125, -0.0595703125, 0.0390625, 0.1376953125, 0.236328125, 0.3349609375, 0.43359375, 0.5322265625, 0.630859375, 0.7294921875, 0.828125, 0.9267578125, 1.025390625, 1.1240234375, 1.22265625, 1.3212890625, 1.419921875, 1.5185546875, 1.6171875, 1.7158203125, 1.814453125, 1.9130859375, 2.01171875, 2.1103515625, 2.208984375, 2.3076171875, 2.40625, 2.5048828125, 2.603515625, 2.7021484375, 2.80078125, 2.8994140625, 2.998046875, 3.0966796875, 3.1953125, 3.2939453125, 3.392578125, 3.4912109375, 3.58984375, 3.6884765625, 3.787109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 10.0, 8.0, 17.0, 19.0, 26.0, 36.0, 55.0, 66.0, 103.0, 127.0, 191.0, 372.0, 607.0, 1032.0, 2055.0, 4846.0, 12563.0, 40141.0, 151814.0, 495363.0, 246595.0, 61980.0, 18300.0, 6381.0, 2728.0, 1267.0, 682.0, 368.0, 263.0, 158.0, 120.0, 76.0, 51.0, 27.0, 32.0, 25.0, 14.0, 10.0, 8.0, 7.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.09375, -16.6007080078125, -16.107666015625, -15.6146240234375, -15.12158203125, -14.6285400390625, -14.135498046875, -13.6424560546875, -13.1494140625, -12.6563720703125, -12.163330078125, -11.6702880859375, -11.17724609375, -10.6842041015625, -10.191162109375, -9.6981201171875, -9.205078125, -8.7120361328125, -8.218994140625, -7.7259521484375, -7.23291015625, -6.7398681640625, -6.246826171875, -5.7537841796875, -5.2607421875, -4.7677001953125, -4.274658203125, -3.7816162109375, -3.28857421875, -2.7955322265625, -2.302490234375, -1.8094482421875, -1.31640625, -0.8233642578125, -0.330322265625, 0.1627197265625, 0.65576171875, 1.1488037109375, 1.641845703125, 2.1348876953125, 2.6279296875, 3.1209716796875, 3.614013671875, 4.1070556640625, 4.60009765625, 5.0931396484375, 5.586181640625, 6.0792236328125, 6.572265625, 7.0653076171875, 7.558349609375, 8.0513916015625, 8.54443359375, 9.0374755859375, 9.530517578125, 10.0235595703125, 10.5166015625, 11.0096435546875, 11.502685546875, 11.9957275390625, 12.48876953125, 12.9818115234375, 13.474853515625, 13.9678955078125, 14.4609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 8.0, 10.0, 12.0, 11.0, 10.0, 19.0, 20.0, 16.0, 23.0, 36.0, 41.0, 33.0, 39.0, 51.0, 50.0, 39.0, 47.0, 48.0, 55.0, 34.0, 42.0, 47.0, 44.0, 36.0, 40.0, 32.0, 28.0, 25.0, 22.0, 11.0, 16.0, 15.0, 5.0, 5.0, 5.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.8529052734375, -7.596435546875, -7.3399658203125, -7.08349609375, -6.8270263671875, -6.570556640625, -6.3140869140625, -6.0576171875, -5.8011474609375, -5.544677734375, -5.2882080078125, -5.03173828125, -4.7752685546875, -4.518798828125, -4.2623291015625, -4.005859375, -3.7493896484375, -3.492919921875, -3.2364501953125, -2.97998046875, -2.7235107421875, -2.467041015625, -2.2105712890625, -1.9541015625, -1.6976318359375, -1.441162109375, -1.1846923828125, -0.92822265625, -0.6717529296875, -0.415283203125, -0.1588134765625, 0.09765625, 0.3541259765625, 0.610595703125, 0.8670654296875, 1.12353515625, 1.3800048828125, 1.636474609375, 1.8929443359375, 2.1494140625, 2.4058837890625, 2.662353515625, 2.9188232421875, 3.17529296875, 3.4317626953125, 3.688232421875, 3.9447021484375, 4.201171875, 4.4576416015625, 4.714111328125, 4.9705810546875, 5.22705078125, 5.4835205078125, 5.739990234375, 5.9964599609375, 6.2529296875, 6.5093994140625, 6.765869140625, 7.0223388671875, 7.27880859375, 7.5352783203125, 7.791748046875, 8.0482177734375, 8.3046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 12.0, 13.0, 21.0, 35.0, 93.0, 155.0, 331.0, 820.0, 3004.0, 24394.0, 909427.0, 101540.0, 6484.0, 1360.0, 434.0, 171.0, 104.0, 58.0, 25.0, 28.0, 10.0, 6.0, 4.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.75, -21.95751953125, -21.1650390625, -20.37255859375, -19.580078125, -18.78759765625, -17.9951171875, -17.20263671875, -16.41015625, -15.61767578125, -14.8251953125, -14.03271484375, -13.240234375, -12.44775390625, -11.6552734375, -10.86279296875, -10.0703125, -9.27783203125, -8.4853515625, -7.69287109375, -6.900390625, -6.10791015625, -5.3154296875, -4.52294921875, -3.73046875, -2.93798828125, -2.1455078125, -1.35302734375, -0.560546875, 0.23193359375, 1.0244140625, 1.81689453125, 2.609375, 3.40185546875, 4.1943359375, 4.98681640625, 5.779296875, 6.57177734375, 7.3642578125, 8.15673828125, 8.94921875, 9.74169921875, 10.5341796875, 11.32666015625, 12.119140625, 12.91162109375, 13.7041015625, 14.49658203125, 15.2890625, 16.08154296875, 16.8740234375, 17.66650390625, 18.458984375, 19.25146484375, 20.0439453125, 20.83642578125, 21.62890625, 22.42138671875, 23.2138671875, 24.00634765625, 24.798828125, 25.59130859375, 26.3837890625, 27.17626953125, 27.96875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 12.0, 14.0, 21.0, 23.0, 68.0, 118.0, 191.0, 184.0, 141.0, 89.0, 33.0, 31.0, 25.0, 11.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018768310546875, -0.0018166899681091309, -0.0017565488815307617, -0.0016964077949523926, -0.0016362667083740234, -0.0015761256217956543, -0.0015159845352172852, -0.001455843448638916, -0.0013957023620605469, -0.0013355612754821777, -0.0012754201889038086, -0.0012152791023254395, -0.0011551380157470703, -0.0010949969291687012, -0.001034855842590332, -0.0009747147560119629, -0.0009145736694335938, -0.0008544325828552246, -0.0007942914962768555, -0.0007341504096984863, -0.0006740093231201172, -0.000613868236541748, -0.0005537271499633789, -0.0004935860633850098, -0.0004334449768066406, -0.0003733038902282715, -0.00031316280364990234, -0.0002530217170715332, -0.00019288063049316406, -0.00013273954391479492, -7.259845733642578e-05, -1.245737075805664e-05, 4.76837158203125e-05, 0.00010782480239868164, 0.00016796588897705078, 0.00022810697555541992, 0.00028824806213378906, 0.0003483891487121582, 0.00040853023529052734, 0.0004686713218688965, 0.0005288124084472656, 0.0005889534950256348, 0.0006490945816040039, 0.000709235668182373, 0.0007693767547607422, 0.0008295178413391113, 0.0008896589279174805, 0.0009498000144958496, 0.0010099411010742188, 0.0010700821876525879, 0.001130223274230957, 0.0011903643608093262, 0.0012505054473876953, 0.0013106465339660645, 0.0013707876205444336, 0.0014309287071228027, 0.0014910697937011719, 0.001551210880279541, 0.0016113519668579102, 0.0016714930534362793, 0.0017316341400146484, 0.0017917752265930176, 0.0018519163131713867, 0.0019120573997497559, 0.001972198486328125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 1.0, 4.0, 4.0, 10.0, 23.0, 20.0, 40.0, 67.0, 96.0, 163.0, 282.0, 687.0, 2026.0, 11055.0, 338561.0, 676830.0, 14831.0, 2361.0, 701.0, 289.0, 187.0, 111.0, 62.0, 38.0, 30.0, 20.0, 15.0, 8.0, 7.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.546875, -21.885009765625, -21.22314453125, -20.561279296875, -19.8994140625, -19.237548828125, -18.57568359375, -17.913818359375, -17.251953125, -16.590087890625, -15.92822265625, -15.266357421875, -14.6044921875, -13.942626953125, -13.28076171875, -12.618896484375, -11.95703125, -11.295166015625, -10.63330078125, -9.971435546875, -9.3095703125, -8.647705078125, -7.98583984375, -7.323974609375, -6.662109375, -6.000244140625, -5.33837890625, -4.676513671875, -4.0146484375, -3.352783203125, -2.69091796875, -2.029052734375, -1.3671875, -0.705322265625, -0.04345703125, 0.618408203125, 1.2802734375, 1.942138671875, 2.60400390625, 3.265869140625, 3.927734375, 4.589599609375, 5.25146484375, 5.913330078125, 6.5751953125, 7.237060546875, 7.89892578125, 8.560791015625, 9.22265625, 9.884521484375, 10.54638671875, 11.208251953125, 11.8701171875, 12.531982421875, 13.19384765625, 13.855712890625, 14.517578125, 15.179443359375, 15.84130859375, 16.503173828125, 17.1650390625, 17.826904296875, 18.48876953125, 19.150634765625, 19.8125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 7.0, 11.0, 12.0, 26.0, 67.0, 92.0, 179.0, 225.0, 161.0, 84.0, 53.0, 27.0, 15.0, 12.0, 4.0, 4.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -9.16748046875, -8.7412109375, -8.31494140625, -7.888671875, -7.46240234375, -7.0361328125, -6.60986328125, -6.18359375, -5.75732421875, -5.3310546875, -4.90478515625, -4.478515625, -4.05224609375, -3.6259765625, -3.19970703125, -2.7734375, -2.34716796875, -1.9208984375, -1.49462890625, -1.068359375, -0.64208984375, -0.2158203125, 0.21044921875, 0.63671875, 1.06298828125, 1.4892578125, 1.91552734375, 2.341796875, 2.76806640625, 3.1943359375, 3.62060546875, 4.046875, 4.47314453125, 4.8994140625, 5.32568359375, 5.751953125, 6.17822265625, 6.6044921875, 7.03076171875, 7.45703125, 7.88330078125, 8.3095703125, 8.73583984375, 9.162109375, 9.58837890625, 10.0146484375, 10.44091796875, 10.8671875, 11.29345703125, 11.7197265625, 12.14599609375, 12.572265625, 12.99853515625, 13.4248046875, 13.85107421875, 14.27734375, 14.70361328125, 15.1298828125, 15.55615234375, 15.982421875, 16.40869140625, 16.8349609375, 17.26123046875, 17.6875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 13.0, 18.0, 27.0, 74.0, 159.0, 245.0, 231.0, 141.0, 60.0, 19.0, 9.0, 7.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-242.52931213378906, -235.78237915039062, -229.03543090820312, -222.2884979248047, -215.54156494140625, -208.79461669921875, -202.0476837158203, -195.30075073242188, -188.55380249023438, -181.80686950683594, -175.05992126464844, -168.31298828125, -161.56605529785156, -154.81912231445312, -148.07217407226562, -141.3252410888672, -134.57830810546875, -127.83136749267578, -121.08443450927734, -114.33749389648438, -107.59056091308594, -100.84362030029297, -94.0966796875, -87.34974670410156, -80.6028060913086, -73.85586547851562, -67.10893249511719, -60.36199188232422, -53.615055084228516, -46.86811828613281, -40.121177673339844, -33.37424087524414, -26.6273193359375, -19.880382537841797, -13.133443832397461, -6.386505126953125, 0.3604316711425781, 7.107368469238281, 13.85430908203125, 20.601245880126953, 27.348182678222656, 34.09511947631836, 40.84205627441406, 47.58899688720703, 54.335933685302734, 61.08287048339844, 67.8298110961914, 74.57675170898438, 81.32368469238281, 88.07062530517578, 94.81755828857422, 101.56449890136719, 108.31143188476562, 115.0583724975586, 121.80531311035156, 128.55224609375, 135.2991943359375, 142.04612731933594, 148.79307556152344, 155.54000854492188, 162.2869415283203, 169.03387451171875, 175.78082275390625, 182.5277557373047, 189.27468872070312]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 5.0, 7.0, 2.0, 6.0, 9.0, 10.0, 15.0, 20.0, 11.0, 17.0, 15.0, 14.0, 32.0, 25.0, 20.0, 32.0, 30.0, 34.0, 35.0, 37.0, 27.0, 34.0, 29.0, 46.0, 42.0, 47.0, 31.0, 40.0, 33.0, 35.0, 26.0, 31.0, 29.0, 21.0, 23.0, 17.0, 25.0, 23.0, 10.0, 12.0, 10.0, 9.0, 8.0, 5.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.47075271606445, -36.26725769042969, -35.06376647949219, -33.86027145385742, -32.65678024291992, -31.453285217285156, -30.249792098999023, -29.04629898071289, -27.842805862426758, -26.639312744140625, -25.435819625854492, -24.23232650756836, -23.028831481933594, -21.825340270996094, -20.621845245361328, -19.418352127075195, -18.214859008789062, -17.01136589050293, -15.807872772216797, -14.604378700256348, -13.400885581970215, -12.197392463684082, -10.993898391723633, -9.7904052734375, -8.586912155151367, -7.383419036865234, -6.179925441741943, -4.976431846618652, -3.7729387283325195, -2.5694456100463867, -1.3659520149230957, -0.1624584197998047, 1.0410308837890625, 2.2445242404937744, 3.4480175971984863, 4.651511192321777, 5.85500431060791, 7.058497428894043, 8.261991500854492, 9.465484619140625, 10.668977737426758, 11.87247085571289, 13.075963973999023, 14.279458045959473, 15.482951164245605, 16.686443328857422, 17.889938354492188, 19.09343147277832, 20.296924591064453, 21.500417709350586, 22.70391082763672, 23.90740394592285, 25.110897064208984, 26.31439208984375, 27.517885208129883, 28.721378326416016, 29.92487144470215, 31.12836456298828, 32.33185958862305, 33.53535079956055, 34.73884582519531, 35.94233703613281, 37.14583206176758, 38.349327087402344, 39.552818298339844]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 14.0, 16.0, 15.0, 28.0, 54.0, 81.0, 143.0, 242.0, 440.0, 847.0, 2021.0, 5179.0, 15077.0, 64170.0, 1422916.0, 2590761.0, 67053.0, 15676.0, 5255.0, 2086.0, 967.0, 518.0, 259.0, 164.0, 102.0, 57.0, 37.0, 34.0, 20.0, 10.0, 7.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8125, -15.28564453125, -14.7587890625, -14.23193359375, -13.705078125, -13.17822265625, -12.6513671875, -12.12451171875, -11.59765625, -11.07080078125, -10.5439453125, -10.01708984375, -9.490234375, -8.96337890625, -8.4365234375, -7.90966796875, -7.3828125, -6.85595703125, -6.3291015625, -5.80224609375, -5.275390625, -4.74853515625, -4.2216796875, -3.69482421875, -3.16796875, -2.64111328125, -2.1142578125, -1.58740234375, -1.060546875, -0.53369140625, -0.0068359375, 0.52001953125, 1.046875, 1.57373046875, 2.1005859375, 2.62744140625, 3.154296875, 3.68115234375, 4.2080078125, 4.73486328125, 5.26171875, 5.78857421875, 6.3154296875, 6.84228515625, 7.369140625, 7.89599609375, 8.4228515625, 8.94970703125, 9.4765625, 10.00341796875, 10.5302734375, 11.05712890625, 11.583984375, 12.11083984375, 12.6376953125, 13.16455078125, 13.69140625, 14.21826171875, 14.7451171875, 15.27197265625, 15.798828125, 16.32568359375, 16.8525390625, 17.37939453125, 17.90625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 9.0, 2.0, 11.0, 11.0, 18.0, 31.0, 35.0, 49.0, 58.0, 57.0, 101.0, 86.0, 77.0, 89.0, 68.0, 58.0, 53.0, 54.0, 50.0, 31.0, 12.0, 13.0, 6.0, 12.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.92523193359375, -2.8192138671875, -2.71319580078125, -2.607177734375, -2.50115966796875, -2.3951416015625, -2.28912353515625, -2.18310546875, -2.07708740234375, -1.9710693359375, -1.86505126953125, -1.759033203125, -1.65301513671875, -1.5469970703125, -1.44097900390625, -1.3349609375, -1.22894287109375, -1.1229248046875, -1.01690673828125, -0.910888671875, -0.80487060546875, -0.6988525390625, -0.59283447265625, -0.48681640625, -0.38079833984375, -0.2747802734375, -0.16876220703125, -0.062744140625, 0.04327392578125, 0.1492919921875, 0.25531005859375, 0.361328125, 0.46734619140625, 0.5733642578125, 0.67938232421875, 0.785400390625, 0.89141845703125, 0.9974365234375, 1.10345458984375, 1.20947265625, 1.31549072265625, 1.4215087890625, 1.52752685546875, 1.633544921875, 1.73956298828125, 1.8455810546875, 1.95159912109375, 2.0576171875, 2.16363525390625, 2.2696533203125, 2.37567138671875, 2.481689453125, 2.58770751953125, 2.6937255859375, 2.79974365234375, 2.90576171875, 3.01177978515625, 3.1177978515625, 3.22381591796875, 3.329833984375, 3.43585205078125, 3.5418701171875, 3.64788818359375, 3.75390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 11.0, 13.0, 19.0, 28.0, 32.0, 47.0, 102.0, 164.0, 313.0, 584.0, 1154.0, 2499.0, 5864.0, 17224.0, 64152.0, 564909.0, 3362606.0, 130690.0, 28570.0, 8806.0, 3396.0, 1456.0, 729.0, 371.0, 216.0, 114.0, 75.0, 46.0, 35.0, 14.0, 14.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.0234375, -14.571044921875, -14.11865234375, -13.666259765625, -13.2138671875, -12.761474609375, -12.30908203125, -11.856689453125, -11.404296875, -10.951904296875, -10.49951171875, -10.047119140625, -9.5947265625, -9.142333984375, -8.68994140625, -8.237548828125, -7.78515625, -7.332763671875, -6.88037109375, -6.427978515625, -5.9755859375, -5.523193359375, -5.07080078125, -4.618408203125, -4.166015625, -3.713623046875, -3.26123046875, -2.808837890625, -2.3564453125, -1.904052734375, -1.45166015625, -0.999267578125, -0.546875, -0.094482421875, 0.35791015625, 0.810302734375, 1.2626953125, 1.715087890625, 2.16748046875, 2.619873046875, 3.072265625, 3.524658203125, 3.97705078125, 4.429443359375, 4.8818359375, 5.334228515625, 5.78662109375, 6.239013671875, 6.69140625, 7.143798828125, 7.59619140625, 8.048583984375, 8.5009765625, 8.953369140625, 9.40576171875, 9.858154296875, 10.310546875, 10.762939453125, 11.21533203125, 11.667724609375, 12.1201171875, 12.572509765625, 13.02490234375, 13.477294921875, 13.9296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 8.0, 13.0, 24.0, 20.0, 42.0, 44.0, 81.0, 156.0, 284.0, 961.0, 1647.0, 352.0, 175.0, 78.0, 52.0, 39.0, 32.0, 16.0, 13.0, 5.0, 3.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5, -6.30938720703125, -6.1187744140625, -5.92816162109375, -5.737548828125, -5.54693603515625, -5.3563232421875, -5.16571044921875, -4.97509765625, -4.78448486328125, -4.5938720703125, -4.40325927734375, -4.212646484375, -4.02203369140625, -3.8314208984375, -3.64080810546875, -3.4501953125, -3.25958251953125, -3.0689697265625, -2.87835693359375, -2.687744140625, -2.49713134765625, -2.3065185546875, -2.11590576171875, -1.92529296875, -1.73468017578125, -1.5440673828125, -1.35345458984375, -1.162841796875, -0.97222900390625, -0.7816162109375, -0.59100341796875, -0.400390625, -0.20977783203125, -0.0191650390625, 0.17144775390625, 0.362060546875, 0.55267333984375, 0.7432861328125, 0.93389892578125, 1.12451171875, 1.31512451171875, 1.5057373046875, 1.69635009765625, 1.886962890625, 2.07757568359375, 2.2681884765625, 2.45880126953125, 2.6494140625, 2.84002685546875, 3.0306396484375, 3.22125244140625, 3.411865234375, 3.60247802734375, 3.7930908203125, 3.98370361328125, 4.17431640625, 4.36492919921875, 4.5555419921875, 4.74615478515625, 4.936767578125, 5.12738037109375, 5.3179931640625, 5.50860595703125, 5.69921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 21.0, 26.0, 56.0, 150.0, 233.0, 226.0, 146.0, 80.0, 35.0, 11.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.59926986694336, -57.751243591308594, -55.903221130371094, -54.055198669433594, -52.20717239379883, -50.35914611816406, -48.51112365722656, -46.66310119628906, -44.8150749206543, -42.96704864501953, -41.11902618408203, -39.27100372314453, -37.422977447509766, -35.574951171875, -33.7269287109375, -31.878904342651367, -30.030879974365234, -28.1828556060791, -26.33483123779297, -24.486806869506836, -22.638782501220703, -20.79075813293457, -18.942733764648438, -17.094709396362305, -15.246685028076172, -13.398660659790039, -11.550636291503906, -9.702611923217773, -7.854587554931641, -6.006563186645508, -4.158538818359375, -2.310514450073242, -0.46248626708984375, 1.385538101196289, 3.233562469482422, 5.081586837768555, 6.9296112060546875, 8.77763557434082, 10.625659942626953, 12.473684310913086, 14.321708679199219, 16.16973304748535, 18.017757415771484, 19.865781784057617, 21.71380615234375, 23.561830520629883, 25.409854888916016, 27.25787925720215, 29.10590362548828, 30.953927993774414, 32.80195236206055, 34.64997863769531, 36.49800109863281, 38.34602355957031, 40.19404983520508, 42.042076110839844, 43.890098571777344, 45.738121032714844, 47.58614730834961, 49.434173583984375, 51.282196044921875, 53.130218505859375, 54.97824478149414, 56.826271057128906, 58.674293518066406]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 4.0, 3.0, 11.0, 13.0, 11.0, 13.0, 13.0, 17.0, 20.0, 16.0, 14.0, 32.0, 35.0, 40.0, 43.0, 34.0, 46.0, 38.0, 46.0, 45.0, 40.0, 40.0, 40.0, 39.0, 35.0, 37.0, 46.0, 37.0, 31.0, 30.0, 16.0, 25.0, 19.0, 15.0, 17.0, 11.0, 8.0, 4.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.519676208496094, -15.999293327331543, -15.478910446166992, -14.958526611328125, -14.438143730163574, -13.917760848999023, -13.397377014160156, -12.876994132995605, -12.356611251831055, -11.836228370666504, -11.315845489501953, -10.795461654663086, -10.275078773498535, -9.754695892333984, -9.234312057495117, -8.713929176330566, -8.193546295166016, -7.673163414001465, -7.152780055999756, -6.632396697998047, -6.112013816833496, -5.591630935668945, -5.071247577667236, -4.550864219665527, -4.030481338500977, -3.5100982189178467, -2.989715099334717, -2.469331979751587, -1.948948860168457, -1.4285657405853271, -0.9081826210021973, -0.3877995014190674, 0.1325855255126953, 0.6529686450958252, 1.173351764678955, 1.693734884262085, 2.214118003845215, 2.7345011234283447, 3.2548842430114746, 3.7752673625946045, 4.295650482177734, 4.816033363342285, 5.336416721343994, 5.856800079345703, 6.377182960510254, 6.897565841674805, 7.417949199676514, 7.938332557678223, 8.458715438842773, 8.979098320007324, 9.499481201171875, 10.019865036010742, 10.540247917175293, 11.060630798339844, 11.581014633178711, 12.101397514343262, 12.621780395507812, 13.142163276672363, 13.662546157836914, 14.182929992675781, 14.703312873840332, 15.223695755004883, 15.74407958984375, 16.264461517333984, 16.78484535217285]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 7.0, 8.0, 18.0, 19.0, 34.0, 69.0, 96.0, 207.0, 372.0, 685.0, 1382.0, 3120.0, 7212.0, 18727.0, 53037.0, 167331.0, 440667.0, 238489.0, 74773.0, 25485.0, 9509.0, 3790.0, 1706.0, 859.0, 406.0, 237.0, 133.0, 81.0, 38.0, 17.0, 22.0, 10.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.1832275390625, -9.733642578125, -9.2840576171875, -8.83447265625, -8.3848876953125, -7.935302734375, -7.4857177734375, -7.0361328125, -6.5865478515625, -6.136962890625, -5.6873779296875, -5.23779296875, -4.7882080078125, -4.338623046875, -3.8890380859375, -3.439453125, -2.9898681640625, -2.540283203125, -2.0906982421875, -1.64111328125, -1.1915283203125, -0.741943359375, -0.2923583984375, 0.1572265625, 0.6068115234375, 1.056396484375, 1.5059814453125, 1.95556640625, 2.4051513671875, 2.854736328125, 3.3043212890625, 3.75390625, 4.2034912109375, 4.653076171875, 5.1026611328125, 5.55224609375, 6.0018310546875, 6.451416015625, 6.9010009765625, 7.3505859375, 7.8001708984375, 8.249755859375, 8.6993408203125, 9.14892578125, 9.5985107421875, 10.048095703125, 10.4976806640625, 10.947265625, 11.3968505859375, 11.846435546875, 12.2960205078125, 12.74560546875, 13.1951904296875, 13.644775390625, 14.0943603515625, 14.5439453125, 14.9935302734375, 15.443115234375, 15.8927001953125, 16.34228515625, 16.7918701171875, 17.241455078125, 17.6910400390625, 18.140625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 10.0, 12.0, 14.0, 19.0, 22.0, 29.0, 40.0, 42.0, 65.0, 70.0, 81.0, 84.0, 66.0, 83.0, 59.0, 57.0, 57.0, 46.0, 42.0, 30.0, 21.0, 15.0, 11.0, 4.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.060546875, -2.955902099609375, -2.85125732421875, -2.746612548828125, -2.6419677734375, -2.537322998046875, -2.43267822265625, -2.328033447265625, -2.223388671875, -2.118743896484375, -2.01409912109375, -1.909454345703125, -1.8048095703125, -1.700164794921875, -1.59552001953125, -1.490875244140625, -1.38623046875, -1.281585693359375, -1.17694091796875, -1.072296142578125, -0.9676513671875, -0.863006591796875, -0.75836181640625, -0.653717041015625, -0.549072265625, -0.444427490234375, -0.33978271484375, -0.235137939453125, -0.1304931640625, -0.025848388671875, 0.07879638671875, 0.183441162109375, 0.2880859375, 0.392730712890625, 0.49737548828125, 0.602020263671875, 0.7066650390625, 0.811309814453125, 0.91595458984375, 1.020599365234375, 1.125244140625, 1.229888916015625, 1.33453369140625, 1.439178466796875, 1.5438232421875, 1.648468017578125, 1.75311279296875, 1.857757568359375, 1.96240234375, 2.067047119140625, 2.17169189453125, 2.276336669921875, 2.3809814453125, 2.485626220703125, 2.59027099609375, 2.694915771484375, 2.799560546875, 2.904205322265625, 3.00885009765625, 3.113494873046875, 3.2181396484375, 3.322784423828125, 3.42742919921875, 3.532073974609375, 3.63671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 2.0, 5.0, 18.0, 19.0, 22.0, 14.0, 38.0, 71.0, 110.0, 144.0, 215.0, 429.0, 754.0, 1668.0, 3968.0, 10904.0, 35116.0, 126640.0, 468921.0, 292086.0, 73234.0, 21585.0, 7243.0, 2718.0, 1177.0, 583.0, 305.0, 193.0, 130.0, 66.0, 48.0, 30.0, 26.0, 14.0, 11.0, 16.0, 9.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.375, -13.908203125, -13.44140625, -12.974609375, -12.5078125, -12.041015625, -11.57421875, -11.107421875, -10.640625, -10.173828125, -9.70703125, -9.240234375, -8.7734375, -8.306640625, -7.83984375, -7.373046875, -6.90625, -6.439453125, -5.97265625, -5.505859375, -5.0390625, -4.572265625, -4.10546875, -3.638671875, -3.171875, -2.705078125, -2.23828125, -1.771484375, -1.3046875, -0.837890625, -0.37109375, 0.095703125, 0.5625, 1.029296875, 1.49609375, 1.962890625, 2.4296875, 2.896484375, 3.36328125, 3.830078125, 4.296875, 4.763671875, 5.23046875, 5.697265625, 6.1640625, 6.630859375, 7.09765625, 7.564453125, 8.03125, 8.498046875, 8.96484375, 9.431640625, 9.8984375, 10.365234375, 10.83203125, 11.298828125, 11.765625, 12.232421875, 12.69921875, 13.166015625, 13.6328125, 14.099609375, 14.56640625, 15.033203125, 15.5]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 6.0, 7.0, 5.0, 6.0, 11.0, 12.0, 14.0, 17.0, 19.0, 35.0, 28.0, 22.0, 28.0, 35.0, 58.0, 31.0, 45.0, 48.0, 47.0, 39.0, 42.0, 45.0, 50.0, 27.0, 33.0, 38.0, 32.0, 27.0, 26.0, 32.0, 22.0, 19.0, 19.0, 15.0, 11.0, 8.0, 8.0, 8.0, 5.0, 4.0, 2.0, 4.0, 9.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.78125, -9.504150390625, -9.22705078125, -8.949951171875, -8.6728515625, -8.395751953125, -8.11865234375, -7.841552734375, -7.564453125, -7.287353515625, -7.01025390625, -6.733154296875, -6.4560546875, -6.178955078125, -5.90185546875, -5.624755859375, -5.34765625, -5.070556640625, -4.79345703125, -4.516357421875, -4.2392578125, -3.962158203125, -3.68505859375, -3.407958984375, -3.130859375, -2.853759765625, -2.57666015625, -2.299560546875, -2.0224609375, -1.745361328125, -1.46826171875, -1.191162109375, -0.9140625, -0.636962890625, -0.35986328125, -0.082763671875, 0.1943359375, 0.471435546875, 0.74853515625, 1.025634765625, 1.302734375, 1.579833984375, 1.85693359375, 2.134033203125, 2.4111328125, 2.688232421875, 2.96533203125, 3.242431640625, 3.51953125, 3.796630859375, 4.07373046875, 4.350830078125, 4.6279296875, 4.905029296875, 5.18212890625, 5.459228515625, 5.736328125, 6.013427734375, 6.29052734375, 6.567626953125, 6.8447265625, 7.121826171875, 7.39892578125, 7.676025390625, 7.953125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 4.0, 10.0, 15.0, 31.0, 43.0, 66.0, 110.0, 219.0, 424.0, 890.0, 2299.0, 7390.0, 39441.0, 394324.0, 535122.0, 54253.0, 9171.0, 2653.0, 982.0, 514.0, 230.0, 138.0, 85.0, 51.0, 27.0, 17.0, 14.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8515625, -5.5980224609375, -5.344482421875, -5.0909423828125, -4.83740234375, -4.5838623046875, -4.330322265625, -4.0767822265625, -3.8232421875, -3.5697021484375, -3.316162109375, -3.0626220703125, -2.80908203125, -2.5555419921875, -2.302001953125, -2.0484619140625, -1.794921875, -1.5413818359375, -1.287841796875, -1.0343017578125, -0.78076171875, -0.5272216796875, -0.273681640625, -0.0201416015625, 0.2333984375, 0.4869384765625, 0.740478515625, 0.9940185546875, 1.24755859375, 1.5010986328125, 1.754638671875, 2.0081787109375, 2.26171875, 2.5152587890625, 2.768798828125, 3.0223388671875, 3.27587890625, 3.5294189453125, 3.782958984375, 4.0364990234375, 4.2900390625, 4.5435791015625, 4.797119140625, 5.0506591796875, 5.30419921875, 5.5577392578125, 5.811279296875, 6.0648193359375, 6.318359375, 6.5718994140625, 6.825439453125, 7.0789794921875, 7.33251953125, 7.5860595703125, 7.839599609375, 8.0931396484375, 8.3466796875, 8.6002197265625, 8.853759765625, 9.1072998046875, 9.36083984375, 9.6143798828125, 9.867919921875, 10.1214599609375, 10.375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 10.0, 12.0, 16.0, 30.0, 34.0, 97.0, 191.0, 235.0, 172.0, 92.0, 44.0, 21.0, 12.0, 12.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.002956390380859375, -0.002895541489124298, -0.002834692597389221, -0.0027738437056541443, -0.0027129948139190674, -0.0026521459221839905, -0.0025912970304489136, -0.0025304481387138367, -0.0024695992469787598, -0.002408750355243683, -0.002347901463508606, -0.002287052571773529, -0.002226203680038452, -0.0021653547883033752, -0.0021045058965682983, -0.0020436570048332214, -0.0019828081130981445, -0.0019219592213630676, -0.0018611103296279907, -0.0018002614378929138, -0.001739412546157837, -0.00167856365442276, -0.001617714762687683, -0.0015568658709526062, -0.0014960169792175293, -0.0014351680874824524, -0.0013743191957473755, -0.0013134703040122986, -0.0012526214122772217, -0.0011917725205421448, -0.0011309236288070679, -0.001070074737071991, -0.001009225845336914, -0.0009483769536018372, -0.0008875280618667603, -0.0008266791701316833, -0.0007658302783966064, -0.0007049813866615295, -0.0006441324949264526, -0.0005832836031913757, -0.0005224347114562988, -0.0004615858197212219, -0.000400736927986145, -0.0003398880362510681, -0.0002790391445159912, -0.0002181902527809143, -0.0001573413610458374, -9.64924693107605e-05, -3.5643577575683594e-05, 2.520531415939331e-05, 8.605420589447021e-05, 0.00014690309762954712, 0.00020775198936462402, 0.00026860088109970093, 0.00032944977283477783, 0.00039029866456985474, 0.00045114755630493164, 0.0005119964480400085, 0.0005728453397750854, 0.0006336942315101624, 0.0006945431232452393, 0.0007553920149803162, 0.0008162409067153931, 0.00087708979845047, 0.0009379386901855469]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 5.0, 1.0, 5.0, 3.0, 3.0, 8.0, 12.0, 11.0, 18.0, 17.0, 22.0, 31.0, 43.0, 55.0, 74.0, 140.0, 231.0, 384.0, 756.0, 1781.0, 4510.0, 16199.0, 84138.0, 594679.0, 291619.0, 39147.0, 9133.0, 2906.0, 1146.0, 578.0, 316.0, 190.0, 106.0, 69.0, 55.0, 36.0, 30.0, 24.0, 15.0, 12.0, 10.0, 10.0, 5.0, 3.0, 6.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0], "bins": [-5.796875, -5.59552001953125, -5.3941650390625, -5.19281005859375, -4.991455078125, -4.79010009765625, -4.5887451171875, -4.38739013671875, -4.18603515625, -3.98468017578125, -3.7833251953125, -3.58197021484375, -3.380615234375, -3.17926025390625, -2.9779052734375, -2.77655029296875, -2.5751953125, -2.37384033203125, -2.1724853515625, -1.97113037109375, -1.769775390625, -1.56842041015625, -1.3670654296875, -1.16571044921875, -0.96435546875, -0.76300048828125, -0.5616455078125, -0.36029052734375, -0.158935546875, 0.04241943359375, 0.2437744140625, 0.44512939453125, 0.646484375, 0.84783935546875, 1.0491943359375, 1.25054931640625, 1.451904296875, 1.65325927734375, 1.8546142578125, 2.05596923828125, 2.25732421875, 2.45867919921875, 2.6600341796875, 2.86138916015625, 3.062744140625, 3.26409912109375, 3.4654541015625, 3.66680908203125, 3.8681640625, 4.06951904296875, 4.2708740234375, 4.47222900390625, 4.673583984375, 4.87493896484375, 5.0762939453125, 5.27764892578125, 5.47900390625, 5.68035888671875, 5.8817138671875, 6.08306884765625, 6.284423828125, 6.48577880859375, 6.6871337890625, 6.88848876953125, 7.08984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 8.0, 4.0, 10.0, 9.0, 10.0, 18.0, 20.0, 34.0, 38.0, 41.0, 65.0, 66.0, 72.0, 85.0, 60.0, 89.0, 63.0, 53.0, 56.0, 42.0, 28.0, 22.0, 16.0, 15.0, 20.0, 11.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.7265625, -3.57257080078125, -3.4185791015625, -3.26458740234375, -3.110595703125, -2.95660400390625, -2.8026123046875, -2.64862060546875, -2.49462890625, -2.34063720703125, -2.1866455078125, -2.03265380859375, -1.878662109375, -1.72467041015625, -1.5706787109375, -1.41668701171875, -1.2626953125, -1.10870361328125, -0.9547119140625, -0.80072021484375, -0.646728515625, -0.49273681640625, -0.3387451171875, -0.18475341796875, -0.03076171875, 0.12322998046875, 0.2772216796875, 0.43121337890625, 0.585205078125, 0.73919677734375, 0.8931884765625, 1.04718017578125, 1.201171875, 1.35516357421875, 1.5091552734375, 1.66314697265625, 1.817138671875, 1.97113037109375, 2.1251220703125, 2.27911376953125, 2.43310546875, 2.58709716796875, 2.7410888671875, 2.89508056640625, 3.049072265625, 3.20306396484375, 3.3570556640625, 3.51104736328125, 3.6650390625, 3.81903076171875, 3.9730224609375, 4.12701416015625, 4.281005859375, 4.43499755859375, 4.5889892578125, 4.74298095703125, 4.89697265625, 5.05096435546875, 5.2049560546875, 5.35894775390625, 5.512939453125, 5.66693115234375, 5.8209228515625, 5.97491455078125, 6.12890625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 9.0, 12.0, 26.0, 52.0, 130.0, 234.0, 240.0, 165.0, 67.0, 32.0, 17.0, 11.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.76596069335938, -195.070556640625, -189.37513732910156, -183.6797332763672, -177.98431396484375, -172.28890991210938, -166.593505859375, -160.89808654785156, -155.20266723632812, -149.50726318359375, -143.8118438720703, -138.11643981933594, -132.4210205078125, -126.72561645507812, -121.03020477294922, -115.33479309082031, -109.63938903808594, -103.94397735595703, -98.24856567382812, -92.55316162109375, -86.85774230957031, -81.16233825683594, -75.46692657470703, -69.77151489257812, -64.07610321044922, -58.38069152832031, -52.685279846191406, -46.989871978759766, -41.29446029663086, -35.59904861450195, -29.903640747070312, -24.208229064941406, -18.5128173828125, -12.81740665435791, -7.12199592590332, -1.4265861511230469, 4.268825531005859, 9.964237213134766, 15.659645080566406, 21.355056762695312, 27.05046844482422, 32.745880126953125, 38.44129180908203, 44.13669967651367, 49.83211135864258, 55.527523040771484, 61.222930908203125, 66.91834259033203, 72.61375427246094, 78.30916595458984, 84.00457763671875, 89.69998168945312, 95.39540100097656, 101.09080505371094, 106.78621673583984, 112.48162841796875, 118.17704010009766, 123.87245178222656, 129.56785583496094, 135.26327514648438, 140.95867919921875, 146.6540985107422, 152.34950256347656, 158.044921875, 163.74032592773438]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 6.0, 11.0, 8.0, 10.0, 19.0, 12.0, 16.0, 8.0, 12.0, 22.0, 22.0, 27.0, 25.0, 22.0, 35.0, 34.0, 34.0, 28.0, 44.0, 29.0, 36.0, 37.0, 47.0, 33.0, 46.0, 29.0, 44.0, 30.0, 36.0, 18.0, 24.0, 21.0, 19.0, 17.0, 15.0, 16.0, 14.0, 14.0, 9.0, 7.0, 11.0, 9.0, 4.0, 11.0, 6.0, 7.0, 1.0, 3.0, 2.0, 2.0], "bins": [-40.68339920043945, -39.52959060668945, -38.37577819824219, -37.22196960449219, -36.06816101074219, -34.91435241699219, -33.76054382324219, -32.60673141479492, -31.452922821044922, -30.299114227294922, -29.14530372619629, -27.991493225097656, -26.837684631347656, -25.683876037597656, -24.530065536499023, -23.37625503540039, -22.22244644165039, -21.06863784790039, -19.914827346801758, -18.761016845703125, -17.607208251953125, -16.453399658203125, -15.299589157104492, -14.145779609680176, -12.99197006225586, -11.838160514831543, -10.684350967407227, -9.53054141998291, -8.376731872558594, -7.222922325134277, -6.069112777709961, -4.9153032302856445, -3.7614974975585938, -2.6076879501342773, -1.453878402709961, -0.30006885528564453, 0.8537406921386719, 2.0075502395629883, 3.1613597869873047, 4.315169334411621, 5.4689788818359375, 6.622788429260254, 7.77659797668457, 8.930407524108887, 10.084217071533203, 11.23802661895752, 12.391836166381836, 13.545645713806152, 14.699455261230469, 15.853264808654785, 17.0070743560791, 18.160884857177734, 19.314693450927734, 20.468502044677734, 21.622312545776367, 22.776123046875, 23.929931640625, 25.083740234375, 26.237550735473633, 27.391361236572266, 28.545169830322266, 29.698978424072266, 30.8527889251709, 32.00659942626953, 33.16040802001953]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 18.0, 10.0, 23.0, 31.0, 47.0, 80.0, 99.0, 196.0, 342.0, 603.0, 1241.0, 2454.0, 5898.0, 16826.0, 70195.0, 3553189.0, 475656.0, 45585.0, 12476.0, 4734.0, 2171.0, 996.0, 541.0, 329.0, 182.0, 112.0, 62.0, 39.0, 46.0, 25.0, 14.0, 24.0, 8.0, 5.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-24.609375, -23.92333984375, -23.2373046875, -22.55126953125, -21.865234375, -21.17919921875, -20.4931640625, -19.80712890625, -19.12109375, -18.43505859375, -17.7490234375, -17.06298828125, -16.376953125, -15.69091796875, -15.0048828125, -14.31884765625, -13.6328125, -12.94677734375, -12.2607421875, -11.57470703125, -10.888671875, -10.20263671875, -9.5166015625, -8.83056640625, -8.14453125, -7.45849609375, -6.7724609375, -6.08642578125, -5.400390625, -4.71435546875, -4.0283203125, -3.34228515625, -2.65625, -1.97021484375, -1.2841796875, -0.59814453125, 0.087890625, 0.77392578125, 1.4599609375, 2.14599609375, 2.83203125, 3.51806640625, 4.2041015625, 4.89013671875, 5.576171875, 6.26220703125, 6.9482421875, 7.63427734375, 8.3203125, 9.00634765625, 9.6923828125, 10.37841796875, 11.064453125, 11.75048828125, 12.4365234375, 13.12255859375, 13.80859375, 14.49462890625, 15.1806640625, 15.86669921875, 16.552734375, 17.23876953125, 17.9248046875, 18.61083984375, 19.296875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 6.0, 8.0, 14.0, 26.0, 17.0, 28.0, 36.0, 45.0, 49.0, 71.0, 79.0, 71.0, 73.0, 66.0, 61.0, 67.0, 73.0, 46.0, 43.0, 31.0, 27.0, 19.0, 8.0, 9.0, 11.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.20703125, -3.09881591796875, -2.9906005859375, -2.88238525390625, -2.774169921875, -2.66595458984375, -2.5577392578125, -2.44952392578125, -2.34130859375, -2.23309326171875, -2.1248779296875, -2.01666259765625, -1.908447265625, -1.80023193359375, -1.6920166015625, -1.58380126953125, -1.4755859375, -1.36737060546875, -1.2591552734375, -1.15093994140625, -1.042724609375, -0.93450927734375, -0.8262939453125, -0.71807861328125, -0.60986328125, -0.50164794921875, -0.3934326171875, -0.28521728515625, -0.177001953125, -0.06878662109375, 0.0394287109375, 0.14764404296875, 0.255859375, 0.36407470703125, 0.4722900390625, 0.58050537109375, 0.688720703125, 0.79693603515625, 0.9051513671875, 1.01336669921875, 1.12158203125, 1.22979736328125, 1.3380126953125, 1.44622802734375, 1.554443359375, 1.66265869140625, 1.7708740234375, 1.87908935546875, 1.9873046875, 2.09552001953125, 2.2037353515625, 2.31195068359375, 2.420166015625, 2.52838134765625, 2.6365966796875, 2.74481201171875, 2.85302734375, 2.96124267578125, 3.0694580078125, 3.17767333984375, 3.285888671875, 3.39410400390625, 3.5023193359375, 3.61053466796875, 3.71875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 11.0, 13.0, 17.0, 17.0, 31.0, 42.0, 82.0, 126.0, 189.0, 378.0, 731.0, 1486.0, 3668.0, 9912.0, 37810.0, 284804.0, 3710475.0, 111638.0, 21513.0, 6465.0, 2514.0, 1131.0, 531.0, 258.0, 138.0, 87.0, 60.0, 37.0, 30.0, 22.0, 14.0, 16.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-26.890625, -26.20654296875, -25.5224609375, -24.83837890625, -24.154296875, -23.47021484375, -22.7861328125, -22.10205078125, -21.41796875, -20.73388671875, -20.0498046875, -19.36572265625, -18.681640625, -17.99755859375, -17.3134765625, -16.62939453125, -15.9453125, -15.26123046875, -14.5771484375, -13.89306640625, -13.208984375, -12.52490234375, -11.8408203125, -11.15673828125, -10.47265625, -9.78857421875, -9.1044921875, -8.42041015625, -7.736328125, -7.05224609375, -6.3681640625, -5.68408203125, -5.0, -4.31591796875, -3.6318359375, -2.94775390625, -2.263671875, -1.57958984375, -0.8955078125, -0.21142578125, 0.47265625, 1.15673828125, 1.8408203125, 2.52490234375, 3.208984375, 3.89306640625, 4.5771484375, 5.26123046875, 5.9453125, 6.62939453125, 7.3134765625, 7.99755859375, 8.681640625, 9.36572265625, 10.0498046875, 10.73388671875, 11.41796875, 12.10205078125, 12.7861328125, 13.47021484375, 14.154296875, 14.83837890625, 15.5224609375, 16.20654296875, 16.890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 6.0, 10.0, 6.0, 14.0, 18.0, 33.0, 47.0, 63.0, 99.0, 209.0, 915.0, 2060.0, 267.0, 113.0, 64.0, 42.0, 32.0, 18.0, 18.0, 7.0, 6.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-11.171875, -10.91845703125, -10.6650390625, -10.41162109375, -10.158203125, -9.90478515625, -9.6513671875, -9.39794921875, -9.14453125, -8.89111328125, -8.6376953125, -8.38427734375, -8.130859375, -7.87744140625, -7.6240234375, -7.37060546875, -7.1171875, -6.86376953125, -6.6103515625, -6.35693359375, -6.103515625, -5.85009765625, -5.5966796875, -5.34326171875, -5.08984375, -4.83642578125, -4.5830078125, -4.32958984375, -4.076171875, -3.82275390625, -3.5693359375, -3.31591796875, -3.0625, -2.80908203125, -2.5556640625, -2.30224609375, -2.048828125, -1.79541015625, -1.5419921875, -1.28857421875, -1.03515625, -0.78173828125, -0.5283203125, -0.27490234375, -0.021484375, 0.23193359375, 0.4853515625, 0.73876953125, 0.9921875, 1.24560546875, 1.4990234375, 1.75244140625, 2.005859375, 2.25927734375, 2.5126953125, 2.76611328125, 3.01953125, 3.27294921875, 3.5263671875, 3.77978515625, 4.033203125, 4.28662109375, 4.5400390625, 4.79345703125, 5.046875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 11.0, 28.0, 82.0, 155.0, 299.0, 245.0, 124.0, 32.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-124.60200500488281, -122.15337371826172, -119.70474243164062, -117.25611114501953, -114.80747985839844, -112.35885620117188, -109.91022491455078, -107.46159362792969, -105.0129623413086, -102.5643310546875, -100.1156997680664, -97.66706848144531, -95.21844482421875, -92.76981353759766, -90.32118225097656, -87.87255096435547, -85.42391967773438, -82.97528839111328, -80.52665710449219, -78.0780258178711, -75.62939453125, -73.18077087402344, -70.73213958740234, -68.28350830078125, -65.83487701416016, -63.38624572753906, -60.93761444091797, -58.48898696899414, -56.04035568237305, -53.59172439575195, -51.143096923828125, -48.69446563720703, -46.24583435058594, -43.797203063964844, -41.34857177734375, -38.89994430541992, -36.45131301879883, -34.002681732177734, -31.554052352905273, -29.105422973632812, -26.65679168701172, -24.208160400390625, -21.759531021118164, -19.310901641845703, -16.86227035522461, -14.413640022277832, -11.965009689331055, -9.516380310058594, -7.0677490234375, -4.619118690490723, -2.1704883575439453, 0.27814197540283203, 2.7267723083496094, 5.175402641296387, 7.624032974243164, 10.072662353515625, 12.521293640136719, 14.969923973083496, 17.418554306030273, 19.867183685302734, 22.315814971923828, 24.764446258544922, 27.213075637817383, 29.661705017089844, 32.11033630371094]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 5.0, 9.0, 9.0, 9.0, 14.0, 16.0, 18.0, 21.0, 21.0, 34.0, 40.0, 45.0, 36.0, 29.0, 41.0, 42.0, 47.0, 51.0, 50.0, 46.0, 49.0, 38.0, 39.0, 35.0, 31.0, 41.0, 27.0, 22.0, 26.0, 19.0, 16.0, 9.0, 10.0, 14.0, 7.0, 8.0, 7.0, 1.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.26411247253418, -20.590425491333008, -19.916738510131836, -19.243053436279297, -18.569366455078125, -17.895679473876953, -17.22199249267578, -16.54830551147461, -15.874619483947754, -15.200932502746582, -14.527246475219727, -13.853559494018555, -13.179872512817383, -12.506186485290527, -11.832499504089355, -11.1588134765625, -10.485126495361328, -9.811439514160156, -9.1377534866333, -8.464066505432129, -7.790380001068115, -7.116693496704102, -6.44300651550293, -5.769320011138916, -5.095633506774902, -4.421947002410889, -3.748260259628296, -3.074573516845703, -2.4008870124816895, -1.7272005081176758, -1.053513526916504, -0.37982702255249023, 0.2938575744628906, 0.9675441980361938, 1.641230821609497, 2.31491756439209, 2.9886040687561035, 3.662290573120117, 4.335977554321289, 5.009664058685303, 5.683350563049316, 6.35703706741333, 7.030723571777344, 7.704410552978516, 8.378097534179688, 9.051783561706543, 9.725470542907715, 10.39915657043457, 11.072843551635742, 11.746530532836914, 12.42021656036377, 13.093903541564941, 13.767589569091797, 14.441276550292969, 15.11496353149414, 15.788650512695312, 16.462337493896484, 17.136024475097656, 17.809711456298828, 18.4833984375, 19.15708351135254, 19.83077049255371, 20.504457473754883, 21.178144454956055, 21.851829528808594]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 19.0, 21.0, 31.0, 43.0, 66.0, 107.0, 177.0, 279.0, 415.0, 631.0, 1051.0, 1703.0, 2805.0, 4775.0, 8393.0, 15096.0, 29168.0, 56631.0, 113731.0, 215854.0, 267364.0, 159961.0, 81033.0, 40930.0, 21212.0, 11406.0, 6385.0, 3557.0, 2200.0, 1278.0, 822.0, 504.0, 328.0, 191.0, 143.0, 67.0, 68.0, 34.0, 22.0, 14.0, 12.0, 6.0, 4.0, 7.0, 6.0, 1.0, 0.0, 1.0], "bins": [-13.2109375, -12.8465576171875, -12.482177734375, -12.1177978515625, -11.75341796875, -11.3890380859375, -11.024658203125, -10.6602783203125, -10.2958984375, -9.9315185546875, -9.567138671875, -9.2027587890625, -8.83837890625, -8.4739990234375, -8.109619140625, -7.7452392578125, -7.380859375, -7.0164794921875, -6.652099609375, -6.2877197265625, -5.92333984375, -5.5589599609375, -5.194580078125, -4.8302001953125, -4.4658203125, -4.1014404296875, -3.737060546875, -3.3726806640625, -3.00830078125, -2.6439208984375, -2.279541015625, -1.9151611328125, -1.55078125, -1.1864013671875, -0.822021484375, -0.4576416015625, -0.09326171875, 0.2711181640625, 0.635498046875, 0.9998779296875, 1.3642578125, 1.7286376953125, 2.093017578125, 2.4573974609375, 2.82177734375, 3.1861572265625, 3.550537109375, 3.9149169921875, 4.279296875, 4.6436767578125, 5.008056640625, 5.3724365234375, 5.73681640625, 6.1011962890625, 6.465576171875, 6.8299560546875, 7.1943359375, 7.5587158203125, 7.923095703125, 8.2874755859375, 8.65185546875, 9.0162353515625, 9.380615234375, 9.7449951171875, 10.109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 6.0, 8.0, 4.0, 7.0, 16.0, 17.0, 28.0, 29.0, 24.0, 36.0, 48.0, 55.0, 61.0, 46.0, 71.0, 53.0, 70.0, 74.0, 68.0, 51.0, 44.0, 38.0, 30.0, 27.0, 24.0, 18.0, 11.0, 12.0, 8.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.067901611328125, -2.96002197265625, -2.852142333984375, -2.7442626953125, -2.636383056640625, -2.52850341796875, -2.420623779296875, -2.312744140625, -2.204864501953125, -2.09698486328125, -1.989105224609375, -1.8812255859375, -1.773345947265625, -1.66546630859375, -1.557586669921875, -1.44970703125, -1.341827392578125, -1.23394775390625, -1.126068115234375, -1.0181884765625, -0.910308837890625, -0.80242919921875, -0.694549560546875, -0.586669921875, -0.478790283203125, -0.37091064453125, -0.263031005859375, -0.1551513671875, -0.047271728515625, 0.06060791015625, 0.168487548828125, 0.2763671875, 0.384246826171875, 0.49212646484375, 0.600006103515625, 0.7078857421875, 0.815765380859375, 0.92364501953125, 1.031524658203125, 1.139404296875, 1.247283935546875, 1.35516357421875, 1.463043212890625, 1.5709228515625, 1.678802490234375, 1.78668212890625, 1.894561767578125, 2.00244140625, 2.110321044921875, 2.21820068359375, 2.326080322265625, 2.4339599609375, 2.541839599609375, 2.64971923828125, 2.757598876953125, 2.865478515625, 2.973358154296875, 3.08123779296875, 3.189117431640625, 3.2969970703125, 3.404876708984375, 3.51275634765625, 3.620635986328125, 3.728515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 12.0, 10.0, 16.0, 9.0, 17.0, 32.0, 51.0, 72.0, 97.0, 161.0, 249.0, 367.0, 622.0, 1068.0, 2055.0, 4272.0, 10152.0, 27555.0, 91069.0, 327149.0, 407288.0, 118536.0, 34773.0, 12363.0, 5063.0, 2382.0, 1252.0, 677.0, 394.0, 265.0, 167.0, 113.0, 90.0, 52.0, 30.0, 24.0, 11.0, 12.0, 10.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.835205078125, -18.24853515625, -17.661865234375, -17.0751953125, -16.488525390625, -15.90185546875, -15.315185546875, -14.728515625, -14.141845703125, -13.55517578125, -12.968505859375, -12.3818359375, -11.795166015625, -11.20849609375, -10.621826171875, -10.03515625, -9.448486328125, -8.86181640625, -8.275146484375, -7.6884765625, -7.101806640625, -6.51513671875, -5.928466796875, -5.341796875, -4.755126953125, -4.16845703125, -3.581787109375, -2.9951171875, -2.408447265625, -1.82177734375, -1.235107421875, -0.6484375, -0.061767578125, 0.52490234375, 1.111572265625, 1.6982421875, 2.284912109375, 2.87158203125, 3.458251953125, 4.044921875, 4.631591796875, 5.21826171875, 5.804931640625, 6.3916015625, 6.978271484375, 7.56494140625, 8.151611328125, 8.73828125, 9.324951171875, 9.91162109375, 10.498291015625, 11.0849609375, 11.671630859375, 12.25830078125, 12.844970703125, 13.431640625, 14.018310546875, 14.60498046875, 15.191650390625, 15.7783203125, 16.364990234375, 16.95166015625, 17.538330078125, 18.125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 7.0, 8.0, 16.0, 13.0, 22.0, 17.0, 21.0, 27.0, 25.0, 35.0, 36.0, 31.0, 48.0, 34.0, 57.0, 48.0, 56.0, 52.0, 53.0, 46.0, 31.0, 36.0, 36.0, 31.0, 38.0, 33.0, 22.0, 17.0, 14.0, 15.0, 11.0, 13.0, 8.0, 6.0, 2.0, 9.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9296875, -12.5113525390625, -12.093017578125, -11.6746826171875, -11.25634765625, -10.8380126953125, -10.419677734375, -10.0013427734375, -9.5830078125, -9.1646728515625, -8.746337890625, -8.3280029296875, -7.90966796875, -7.4913330078125, -7.072998046875, -6.6546630859375, -6.236328125, -5.8179931640625, -5.399658203125, -4.9813232421875, -4.56298828125, -4.1446533203125, -3.726318359375, -3.3079833984375, -2.8896484375, -2.4713134765625, -2.052978515625, -1.6346435546875, -1.21630859375, -0.7979736328125, -0.379638671875, 0.0386962890625, 0.45703125, 0.8753662109375, 1.293701171875, 1.7120361328125, 2.13037109375, 2.5487060546875, 2.967041015625, 3.3853759765625, 3.8037109375, 4.2220458984375, 4.640380859375, 5.0587158203125, 5.47705078125, 5.8953857421875, 6.313720703125, 6.7320556640625, 7.150390625, 7.5687255859375, 7.987060546875, 8.4053955078125, 8.82373046875, 9.2420654296875, 9.660400390625, 10.0787353515625, 10.4970703125, 10.9154052734375, 11.333740234375, 11.7520751953125, 12.17041015625, 12.5887451171875, 13.007080078125, 13.4254150390625, 13.84375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 10.0, 19.0, 22.0, 47.0, 90.0, 117.0, 251.0, 551.0, 1282.0, 4355.0, 20594.0, 264504.0, 711593.0, 35600.0, 6405.0, 1789.0, 666.0, 309.0, 156.0, 82.0, 39.0, 26.0, 21.0, 11.0, 7.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-29.0625, -28.3887939453125, -27.715087890625, -27.0413818359375, -26.36767578125, -25.6939697265625, -25.020263671875, -24.3465576171875, -23.6728515625, -22.9991455078125, -22.325439453125, -21.6517333984375, -20.97802734375, -20.3043212890625, -19.630615234375, -18.9569091796875, -18.283203125, -17.6094970703125, -16.935791015625, -16.2620849609375, -15.58837890625, -14.9146728515625, -14.240966796875, -13.5672607421875, -12.8935546875, -12.2198486328125, -11.546142578125, -10.8724365234375, -10.19873046875, -9.5250244140625, -8.851318359375, -8.1776123046875, -7.50390625, -6.8302001953125, -6.156494140625, -5.4827880859375, -4.80908203125, -4.1353759765625, -3.461669921875, -2.7879638671875, -2.1142578125, -1.4405517578125, -0.766845703125, -0.0931396484375, 0.58056640625, 1.2542724609375, 1.927978515625, 2.6016845703125, 3.275390625, 3.9490966796875, 4.622802734375, 5.2965087890625, 5.97021484375, 6.6439208984375, 7.317626953125, 7.9913330078125, 8.6650390625, 9.3387451171875, 10.012451171875, 10.6861572265625, 11.35986328125, 12.0335693359375, 12.707275390625, 13.3809814453125, 14.0546875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 5.0, 20.0, 16.0, 14.0, 34.0, 50.0, 64.0, 98.0, 150.0, 174.0, 113.0, 79.0, 39.0, 35.0, 29.0, 20.0, 18.0, 12.0, 5.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00206756591796875, -0.0020033419132232666, -0.0019391179084777832, -0.0018748939037322998, -0.0018106698989868164, -0.001746445894241333, -0.0016822218894958496, -0.0016179978847503662, -0.0015537738800048828, -0.0014895498752593994, -0.001425325870513916, -0.0013611018657684326, -0.0012968778610229492, -0.0012326538562774658, -0.0011684298515319824, -0.001104205846786499, -0.0010399818420410156, -0.0009757578372955322, -0.0009115338325500488, -0.0008473098278045654, -0.000783085823059082, -0.0007188618183135986, -0.0006546378135681152, -0.0005904138088226318, -0.0005261898040771484, -0.00046196579933166504, -0.00039774179458618164, -0.00033351778984069824, -0.00026929378509521484, -0.00020506978034973145, -0.00014084577560424805, -7.662177085876465e-05, -1.239776611328125e-05, 5.182623863220215e-05, 0.00011605024337768555, 0.00018027424812316895, 0.00024449825286865234, 0.00030872225761413574, 0.00037294626235961914, 0.00043717026710510254, 0.0005013942718505859, 0.0005656182765960693, 0.0006298422813415527, 0.0006940662860870361, 0.0007582902908325195, 0.0008225142955780029, 0.0008867383003234863, 0.0009509623050689697, 0.0010151863098144531, 0.0010794103145599365, 0.00114363431930542, 0.0012078583240509033, 0.0012720823287963867, 0.0013363063335418701, 0.0014005303382873535, 0.001464754343032837, 0.0015289783477783203, 0.0015932023525238037, 0.0016574263572692871, 0.0017216503620147705, 0.001785874366760254, 0.0018500983715057373, 0.0019143223762512207, 0.001978546380996704, 0.0020427703857421875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 12.0, 15.0, 29.0, 41.0, 49.0, 98.0, 172.0, 361.0, 862.0, 2567.0, 12023.0, 167365.0, 824246.0, 33336.0, 4934.0, 1383.0, 550.0, 201.0, 111.0, 65.0, 44.0, 30.0, 18.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.09375, -21.311279296875, -20.52880859375, -19.746337890625, -18.9638671875, -18.181396484375, -17.39892578125, -16.616455078125, -15.833984375, -15.051513671875, -14.26904296875, -13.486572265625, -12.7041015625, -11.921630859375, -11.13916015625, -10.356689453125, -9.57421875, -8.791748046875, -8.00927734375, -7.226806640625, -6.4443359375, -5.661865234375, -4.87939453125, -4.096923828125, -3.314453125, -2.531982421875, -1.74951171875, -0.967041015625, -0.1845703125, 0.597900390625, 1.38037109375, 2.162841796875, 2.9453125, 3.727783203125, 4.51025390625, 5.292724609375, 6.0751953125, 6.857666015625, 7.64013671875, 8.422607421875, 9.205078125, 9.987548828125, 10.77001953125, 11.552490234375, 12.3349609375, 13.117431640625, 13.89990234375, 14.682373046875, 15.46484375, 16.247314453125, 17.02978515625, 17.812255859375, 18.5947265625, 19.377197265625, 20.15966796875, 20.942138671875, 21.724609375, 22.507080078125, 23.28955078125, 24.072021484375, 24.8544921875, 25.636962890625, 26.41943359375, 27.201904296875, 27.984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 8.0, 4.0, 9.0, 10.0, 11.0, 14.0, 18.0, 26.0, 29.0, 38.0, 68.0, 87.0, 152.0, 166.0, 118.0, 55.0, 40.0, 32.0, 24.0, 10.0, 9.0, 11.0, 17.0, 9.0, 7.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.8984375, -15.4324951171875, -14.966552734375, -14.5006103515625, -14.03466796875, -13.5687255859375, -13.102783203125, -12.6368408203125, -12.1708984375, -11.7049560546875, -11.239013671875, -10.7730712890625, -10.30712890625, -9.8411865234375, -9.375244140625, -8.9093017578125, -8.443359375, -7.9774169921875, -7.511474609375, -7.0455322265625, -6.57958984375, -6.1136474609375, -5.647705078125, -5.1817626953125, -4.7158203125, -4.2498779296875, -3.783935546875, -3.3179931640625, -2.85205078125, -2.3861083984375, -1.920166015625, -1.4542236328125, -0.98828125, -0.5223388671875, -0.056396484375, 0.4095458984375, 0.87548828125, 1.3414306640625, 1.807373046875, 2.2733154296875, 2.7392578125, 3.2052001953125, 3.671142578125, 4.1370849609375, 4.60302734375, 5.0689697265625, 5.534912109375, 6.0008544921875, 6.466796875, 6.9327392578125, 7.398681640625, 7.8646240234375, 8.33056640625, 8.7965087890625, 9.262451171875, 9.7283935546875, 10.1943359375, 10.6602783203125, 11.126220703125, 11.5921630859375, 12.05810546875, 12.5240478515625, 12.989990234375, 13.4559326171875, 13.921875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 14.0, 44.0, 136.0, 269.0, 302.0, 159.0, 45.0, 19.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-546.0494384765625, -532.0891723632812, -518.1288452148438, -504.1685791015625, -490.2082824707031, -476.24798583984375, -462.2876892089844, -448.327392578125, -434.36712646484375, -420.4068298339844, -406.446533203125, -392.48626708984375, -378.5259704589844, -364.565673828125, -350.6053771972656, -336.64508056640625, -322.6847839355469, -308.7244873046875, -294.7641906738281, -280.80389404296875, -266.8436279296875, -252.88333129882812, -238.92303466796875, -224.96273803710938, -211.00245666503906, -197.0421600341797, -183.08187866210938, -169.12158203125, -155.16128540039062, -141.2010040283203, -127.24070739746094, -113.2804183959961, -99.32015991210938, -85.35987091064453, -71.39958190917969, -57.43928527832031, -43.47899627685547, -29.518707275390625, -15.55841064453125, -1.5981216430664062, 12.362167358398438, 26.322458267211914, 40.28274917602539, 54.2430419921875, 68.20333099365234, 82.16361999511719, 96.12391662597656, 110.0842056274414, 124.04449462890625, 138.00479125976562, 151.96507263183594, 165.9253692626953, 179.88565063476562, 193.845947265625, 207.80624389648438, 221.76654052734375, 235.72682189941406, 249.68711853027344, 263.64739990234375, 277.6076965332031, 291.5679931640625, 305.52825927734375, 319.48858642578125, 333.4488525390625, 347.4091491699219]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 6.0, 4.0, 7.0, 9.0, 13.0, 11.0, 10.0, 12.0, 13.0, 24.0, 23.0, 30.0, 32.0, 26.0, 46.0, 34.0, 49.0, 47.0, 50.0, 41.0, 41.0, 46.0, 37.0, 47.0, 39.0, 29.0, 33.0, 33.0, 29.0, 32.0, 24.0, 14.0, 18.0, 16.0, 5.0, 13.0, 5.0, 7.0, 11.0, 5.0, 6.0, 4.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.2705078125, -71.7385482788086, -69.20658111572266, -66.67462158203125, -64.14265441894531, -61.61069107055664, -59.07872772216797, -56.54676818847656, -54.014801025390625, -51.48283767700195, -48.95087432861328, -46.41891098022461, -43.88694763183594, -41.354984283447266, -38.823020935058594, -36.29106140136719, -33.759098052978516, -31.227134704589844, -28.695171356201172, -26.1632080078125, -23.631244659423828, -21.099281311035156, -18.567319869995117, -16.035356521606445, -13.503393173217773, -10.971429824829102, -8.43946647644043, -5.907504081726074, -3.3755407333374023, -0.8435773849487305, 1.688385009765625, 4.220348358154297, 6.752311706542969, 9.28427505493164, 11.816238403320312, 14.348200798034668, 16.880165100097656, 19.412128448486328, 21.944089889526367, 24.47605323791504, 27.00801658630371, 29.539979934692383, 32.07194137573242, 34.603904724121094, 37.135868072509766, 39.66783142089844, 42.19979476928711, 44.73175811767578, 47.26372146606445, 49.795684814453125, 52.3276481628418, 54.85961151123047, 57.39157485961914, 59.92353820800781, 62.45549774169922, 64.98746490478516, 67.51942443847656, 70.05138397216797, 72.5833511352539, 75.11531066894531, 77.64727783203125, 80.17923736572266, 82.7112045288086, 85.2431640625, 87.77513122558594]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 9.0, 19.0, 23.0, 40.0, 52.0, 111.0, 214.0, 382.0, 735.0, 1497.0, 3332.0, 8339.0, 25010.0, 118945.0, 3742260.0, 236318.0, 37554.0, 11161.0, 4310.0, 1886.0, 935.0, 532.0, 272.0, 152.0, 96.0, 41.0, 26.0, 18.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.390625, -25.469482421875, -24.54833984375, -23.627197265625, -22.7060546875, -21.784912109375, -20.86376953125, -19.942626953125, -19.021484375, -18.100341796875, -17.17919921875, -16.258056640625, -15.3369140625, -14.415771484375, -13.49462890625, -12.573486328125, -11.65234375, -10.731201171875, -9.81005859375, -8.888916015625, -7.9677734375, -7.046630859375, -6.12548828125, -5.204345703125, -4.283203125, -3.362060546875, -2.44091796875, -1.519775390625, -0.5986328125, 0.322509765625, 1.24365234375, 2.164794921875, 3.0859375, 4.007080078125, 4.92822265625, 5.849365234375, 6.7705078125, 7.691650390625, 8.61279296875, 9.533935546875, 10.455078125, 11.376220703125, 12.29736328125, 13.218505859375, 14.1396484375, 15.060791015625, 15.98193359375, 16.903076171875, 17.82421875, 18.745361328125, 19.66650390625, 20.587646484375, 21.5087890625, 22.429931640625, 23.35107421875, 24.272216796875, 25.193359375, 26.114501953125, 27.03564453125, 27.956787109375, 28.8779296875, 29.799072265625, 30.72021484375, 31.641357421875, 32.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 10.0, 15.0, 12.0, 10.0, 20.0, 24.0, 35.0, 37.0, 58.0, 49.0, 37.0, 67.0, 79.0, 77.0, 47.0, 57.0, 56.0, 62.0, 38.0, 49.0, 33.0, 30.0, 16.0, 18.0, 15.0, 15.0, 10.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.88671875, -4.752716064453125, -4.61871337890625, -4.484710693359375, -4.3507080078125, -4.216705322265625, -4.08270263671875, -3.948699951171875, -3.814697265625, -3.680694580078125, -3.54669189453125, -3.412689208984375, -3.2786865234375, -3.144683837890625, -3.01068115234375, -2.876678466796875, -2.74267578125, -2.608673095703125, -2.47467041015625, -2.340667724609375, -2.2066650390625, -2.072662353515625, -1.93865966796875, -1.804656982421875, -1.670654296875, -1.536651611328125, -1.40264892578125, -1.268646240234375, -1.1346435546875, -1.000640869140625, -0.86663818359375, -0.732635498046875, -0.5986328125, -0.464630126953125, -0.33062744140625, -0.196624755859375, -0.0626220703125, 0.071380615234375, 0.20538330078125, 0.339385986328125, 0.473388671875, 0.607391357421875, 0.74139404296875, 0.875396728515625, 1.0093994140625, 1.143402099609375, 1.27740478515625, 1.411407470703125, 1.54541015625, 1.679412841796875, 1.81341552734375, 1.947418212890625, 2.0814208984375, 2.215423583984375, 2.34942626953125, 2.483428955078125, 2.617431640625, 2.751434326171875, 2.88543701171875, 3.019439697265625, 3.1534423828125, 3.287445068359375, 3.42144775390625, 3.555450439453125, 3.689453125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 7.0, 12.0, 14.0, 12.0, 19.0, 30.0, 53.0, 78.0, 99.0, 153.0, 239.0, 481.0, 1119.0, 3287.0, 12480.0, 79392.0, 3873626.0, 194935.0, 20329.0, 4946.0, 1552.0, 575.0, 280.0, 186.0, 112.0, 81.0, 46.0, 43.0, 22.0, 21.0, 16.0, 8.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.625, -51.0615234375, -49.498046875, -47.9345703125, -46.37109375, -44.8076171875, -43.244140625, -41.6806640625, -40.1171875, -38.5537109375, -36.990234375, -35.4267578125, -33.86328125, -32.2998046875, -30.736328125, -29.1728515625, -27.609375, -26.0458984375, -24.482421875, -22.9189453125, -21.35546875, -19.7919921875, -18.228515625, -16.6650390625, -15.1015625, -13.5380859375, -11.974609375, -10.4111328125, -8.84765625, -7.2841796875, -5.720703125, -4.1572265625, -2.59375, -1.0302734375, 0.533203125, 2.0966796875, 3.66015625, 5.2236328125, 6.787109375, 8.3505859375, 9.9140625, 11.4775390625, 13.041015625, 14.6044921875, 16.16796875, 17.7314453125, 19.294921875, 20.8583984375, 22.421875, 23.9853515625, 25.548828125, 27.1123046875, 28.67578125, 30.2392578125, 31.802734375, 33.3662109375, 34.9296875, 36.4931640625, 38.056640625, 39.6201171875, 41.18359375, 42.7470703125, 44.310546875, 45.8740234375, 47.4375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 5.0, 18.0, 24.0, 47.0, 118.0, 287.0, 2746.0, 554.0, 134.0, 58.0, 32.0, 19.0, 4.0, 3.0, 9.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.09375, -21.19873046875, -20.3037109375, -19.40869140625, -18.513671875, -17.61865234375, -16.7236328125, -15.82861328125, -14.93359375, -14.03857421875, -13.1435546875, -12.24853515625, -11.353515625, -10.45849609375, -9.5634765625, -8.66845703125, -7.7734375, -6.87841796875, -5.9833984375, -5.08837890625, -4.193359375, -3.29833984375, -2.4033203125, -1.50830078125, -0.61328125, 0.28173828125, 1.1767578125, 2.07177734375, 2.966796875, 3.86181640625, 4.7568359375, 5.65185546875, 6.546875, 7.44189453125, 8.3369140625, 9.23193359375, 10.126953125, 11.02197265625, 11.9169921875, 12.81201171875, 13.70703125, 14.60205078125, 15.4970703125, 16.39208984375, 17.287109375, 18.18212890625, 19.0771484375, 19.97216796875, 20.8671875, 21.76220703125, 22.6572265625, 23.55224609375, 24.447265625, 25.34228515625, 26.2373046875, 27.13232421875, 28.02734375, 28.92236328125, 29.8173828125, 30.71240234375, 31.607421875, 32.50244140625, 33.3974609375, 34.29248046875, 35.1875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 19.0, 122.0, 513.0, 292.0, 43.0, 12.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-533.2161865234375, -521.8177490234375, -510.4193115234375, -499.0208740234375, -487.6224060058594, -476.2239685058594, -464.8255310058594, -453.4270935058594, -442.0286560058594, -430.6302185058594, -419.2317810058594, -407.83331298828125, -396.43487548828125, -385.03643798828125, -373.63800048828125, -362.23956298828125, -350.84112548828125, -339.44268798828125, -328.04425048828125, -316.64581298828125, -305.2473449707031, -293.8489074707031, -282.4504699707031, -271.0520324707031, -259.653564453125, -248.255126953125, -236.85667419433594, -225.45823669433594, -214.05979919433594, -202.66134643554688, -191.26290893554688, -179.86447143554688, -168.46604919433594, -157.06761169433594, -145.66915893554688, -134.27072143554688, -122.87228393554688, -111.47383880615234, -100.07539367675781, -88.67695617675781, -77.27851104736328, -65.88006591796875, -54.48162841796875, -43.08318328857422, -31.684741973876953, -20.286300659179688, -8.887855529785156, 2.5105819702148438, 13.909027099609375, 25.30746841430664, 36.705909729003906, 48.10435485839844, 59.5027961730957, 70.90123748779297, 82.2996826171875, 93.6981201171875, 105.09656524658203, 116.49501037597656, 127.89344787597656, 139.29190063476562, 150.69033813476562, 162.08877563476562, 173.48721313476562, 184.88565063476562, 196.2841033935547]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 9.0, 11.0, 8.0, 20.0, 21.0, 30.0, 43.0, 38.0, 58.0, 57.0, 49.0, 64.0, 64.0, 55.0, 75.0, 67.0, 66.0, 40.0, 56.0, 34.0, 33.0, 16.0, 19.0, 17.0, 14.0, 14.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.24303436279297, -66.18338775634766, -64.12373352050781, -62.0640869140625, -60.00444030761719, -57.94478988647461, -55.88513946533203, -53.82549285888672, -51.76584243774414, -49.70619201660156, -47.64654541015625, -45.58689498901367, -43.527244567871094, -41.46759796142578, -39.4079475402832, -37.348297119140625, -35.28865051269531, -33.229000091552734, -31.169353485107422, -29.109703063964844, -27.0500545501709, -24.990406036376953, -22.930755615234375, -20.87110710144043, -18.811458587646484, -16.75181007385254, -14.692160606384277, -12.632511138916016, -10.57286262512207, -8.513214111328125, -6.453564643859863, -4.393915176391602, -2.3342666625976562, -0.27461767196655273, 1.7850313186645508, 3.8446803092956543, 5.904329299926758, 7.963977813720703, 10.023627281188965, 12.083276748657227, 14.142925262451172, 16.202573776245117, 18.262222290039062, 20.32187271118164, 22.381521224975586, 24.44116973876953, 26.50082015991211, 28.560468673706055, 30.6201171875, 32.67976760864258, 34.73941421508789, 36.79906463623047, 38.85871124267578, 40.91836166381836, 42.97801208496094, 45.03765869140625, 47.09730911254883, 49.156959533691406, 51.21660614013672, 53.2762565612793, 55.335906982421875, 57.39555358886719, 59.455204010009766, 61.514854431152344, 63.574501037597656]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 9.0, 8.0, 8.0, 12.0, 24.0, 54.0, 66.0, 91.0, 128.0, 216.0, 314.0, 505.0, 791.0, 1158.0, 1858.0, 2972.0, 4576.0, 7573.0, 12969.0, 22815.0, 41802.0, 78808.0, 143306.0, 217849.0, 211913.0, 134126.0, 72804.0, 38973.0, 21341.0, 12322.0, 7234.0, 4392.0, 2686.0, 1647.0, 1108.0, 729.0, 454.0, 286.0, 204.0, 134.0, 103.0, 53.0, 36.0, 32.0, 14.0, 18.0, 16.0, 2.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.515625, -13.064208984375, -12.61279296875, -12.161376953125, -11.7099609375, -11.258544921875, -10.80712890625, -10.355712890625, -9.904296875, -9.452880859375, -9.00146484375, -8.550048828125, -8.0986328125, -7.647216796875, -7.19580078125, -6.744384765625, -6.29296875, -5.841552734375, -5.39013671875, -4.938720703125, -4.4873046875, -4.035888671875, -3.58447265625, -3.133056640625, -2.681640625, -2.230224609375, -1.77880859375, -1.327392578125, -0.8759765625, -0.424560546875, 0.02685546875, 0.478271484375, 0.9296875, 1.381103515625, 1.83251953125, 2.283935546875, 2.7353515625, 3.186767578125, 3.63818359375, 4.089599609375, 4.541015625, 4.992431640625, 5.44384765625, 5.895263671875, 6.3466796875, 6.798095703125, 7.24951171875, 7.700927734375, 8.15234375, 8.603759765625, 9.05517578125, 9.506591796875, 9.9580078125, 10.409423828125, 10.86083984375, 11.312255859375, 11.763671875, 12.215087890625, 12.66650390625, 13.117919921875, 13.5693359375, 14.020751953125, 14.47216796875, 14.923583984375, 15.375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 7.0, 16.0, 9.0, 11.0, 20.0, 25.0, 29.0, 34.0, 28.0, 39.0, 48.0, 39.0, 56.0, 39.0, 65.0, 52.0, 46.0, 50.0, 43.0, 49.0, 29.0, 39.0, 45.0, 30.0, 30.0, 14.0, 21.0, 11.0, 15.0, 10.0, 6.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.4375, -4.30853271484375, -4.1795654296875, -4.05059814453125, -3.921630859375, -3.79266357421875, -3.6636962890625, -3.53472900390625, -3.40576171875, -3.27679443359375, -3.1478271484375, -3.01885986328125, -2.889892578125, -2.76092529296875, -2.6319580078125, -2.50299072265625, -2.3740234375, -2.24505615234375, -2.1160888671875, -1.98712158203125, -1.858154296875, -1.72918701171875, -1.6002197265625, -1.47125244140625, -1.34228515625, -1.21331787109375, -1.0843505859375, -0.95538330078125, -0.826416015625, -0.69744873046875, -0.5684814453125, -0.43951416015625, -0.310546875, -0.18157958984375, -0.0526123046875, 0.07635498046875, 0.205322265625, 0.33428955078125, 0.4632568359375, 0.59222412109375, 0.72119140625, 0.85015869140625, 0.9791259765625, 1.10809326171875, 1.237060546875, 1.36602783203125, 1.4949951171875, 1.62396240234375, 1.7529296875, 1.88189697265625, 2.0108642578125, 2.13983154296875, 2.268798828125, 2.39776611328125, 2.5267333984375, 2.65570068359375, 2.78466796875, 2.91363525390625, 3.0426025390625, 3.17156982421875, 3.300537109375, 3.42950439453125, 3.5584716796875, 3.68743896484375, 3.81640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 10.0, 8.0, 21.0, 14.0, 25.0, 39.0, 47.0, 53.0, 81.0, 112.0, 185.0, 272.0, 359.0, 693.0, 1253.0, 2486.0, 5509.0, 13584.0, 38162.0, 122196.0, 356882.0, 336861.0, 111339.0, 35212.0, 12682.0, 5061.0, 2329.0, 1232.0, 636.0, 411.0, 251.0, 151.0, 114.0, 65.0, 52.0, 40.0, 29.0, 28.0, 20.0, 11.0, 9.0, 11.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.078125, -25.26220703125, -24.4462890625, -23.63037109375, -22.814453125, -21.99853515625, -21.1826171875, -20.36669921875, -19.55078125, -18.73486328125, -17.9189453125, -17.10302734375, -16.287109375, -15.47119140625, -14.6552734375, -13.83935546875, -13.0234375, -12.20751953125, -11.3916015625, -10.57568359375, -9.759765625, -8.94384765625, -8.1279296875, -7.31201171875, -6.49609375, -5.68017578125, -4.8642578125, -4.04833984375, -3.232421875, -2.41650390625, -1.6005859375, -0.78466796875, 0.03125, 0.84716796875, 1.6630859375, 2.47900390625, 3.294921875, 4.11083984375, 4.9267578125, 5.74267578125, 6.55859375, 7.37451171875, 8.1904296875, 9.00634765625, 9.822265625, 10.63818359375, 11.4541015625, 12.27001953125, 13.0859375, 13.90185546875, 14.7177734375, 15.53369140625, 16.349609375, 17.16552734375, 17.9814453125, 18.79736328125, 19.61328125, 20.42919921875, 21.2451171875, 22.06103515625, 22.876953125, 23.69287109375, 24.5087890625, 25.32470703125, 26.140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 9.0, 13.0, 14.0, 16.0, 23.0, 13.0, 11.0, 28.0, 16.0, 29.0, 32.0, 43.0, 41.0, 39.0, 54.0, 48.0, 54.0, 45.0, 49.0, 49.0, 39.0, 48.0, 54.0, 50.0, 32.0, 18.0, 25.0, 25.0, 19.0, 23.0, 8.0, 5.0, 6.0, 9.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.125, -21.43701171875, -20.7490234375, -20.06103515625, -19.373046875, -18.68505859375, -17.9970703125, -17.30908203125, -16.62109375, -15.93310546875, -15.2451171875, -14.55712890625, -13.869140625, -13.18115234375, -12.4931640625, -11.80517578125, -11.1171875, -10.42919921875, -9.7412109375, -9.05322265625, -8.365234375, -7.67724609375, -6.9892578125, -6.30126953125, -5.61328125, -4.92529296875, -4.2373046875, -3.54931640625, -2.861328125, -2.17333984375, -1.4853515625, -0.79736328125, -0.109375, 0.57861328125, 1.2666015625, 1.95458984375, 2.642578125, 3.33056640625, 4.0185546875, 4.70654296875, 5.39453125, 6.08251953125, 6.7705078125, 7.45849609375, 8.146484375, 8.83447265625, 9.5224609375, 10.21044921875, 10.8984375, 11.58642578125, 12.2744140625, 12.96240234375, 13.650390625, 14.33837890625, 15.0263671875, 15.71435546875, 16.40234375, 17.09033203125, 17.7783203125, 18.46630859375, 19.154296875, 19.84228515625, 20.5302734375, 21.21826171875, 21.90625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 12.0, 15.0, 18.0, 27.0, 51.0, 65.0, 119.0, 278.0, 908.0, 4251.0, 45244.0, 887800.0, 101199.0, 6645.0, 1237.0, 354.0, 115.0, 86.0, 44.0, 24.0, 24.0, 15.0, 11.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.125, -48.6337890625, -47.142578125, -45.6513671875, -44.16015625, -42.6689453125, -41.177734375, -39.6865234375, -38.1953125, -36.7041015625, -35.212890625, -33.7216796875, -32.23046875, -30.7392578125, -29.248046875, -27.7568359375, -26.265625, -24.7744140625, -23.283203125, -21.7919921875, -20.30078125, -18.8095703125, -17.318359375, -15.8271484375, -14.3359375, -12.8447265625, -11.353515625, -9.8623046875, -8.37109375, -6.8798828125, -5.388671875, -3.8974609375, -2.40625, -0.9150390625, 0.576171875, 2.0673828125, 3.55859375, 5.0498046875, 6.541015625, 8.0322265625, 9.5234375, 11.0146484375, 12.505859375, 13.9970703125, 15.48828125, 16.9794921875, 18.470703125, 19.9619140625, 21.453125, 22.9443359375, 24.435546875, 25.9267578125, 27.41796875, 28.9091796875, 30.400390625, 31.8916015625, 33.3828125, 34.8740234375, 36.365234375, 37.8564453125, 39.34765625, 40.8388671875, 42.330078125, 43.8212890625, 45.3125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 4.0, 10.0, 12.0, 15.0, 27.0, 34.0, 33.0, 55.0, 74.0, 73.0, 87.0, 76.0, 93.0, 98.0, 64.0, 50.0, 39.0, 32.0, 20.0, 12.0, 12.0, 16.0, 9.0, 8.0, 5.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0019168853759765625, -0.0018523037433624268, -0.001787722110748291, -0.0017231404781341553, -0.0016585588455200195, -0.0015939772129058838, -0.001529395580291748, -0.0014648139476776123, -0.0014002323150634766, -0.0013356506824493408, -0.001271069049835205, -0.0012064874172210693, -0.0011419057846069336, -0.0010773241519927979, -0.0010127425193786621, -0.0009481608867645264, -0.0008835792541503906, -0.0008189976215362549, -0.0007544159889221191, -0.0006898343563079834, -0.0006252527236938477, -0.0005606710910797119, -0.0004960894584655762, -0.00043150782585144043, -0.0003669261932373047, -0.00030234456062316895, -0.0002377629280090332, -0.00017318129539489746, -0.00010859966278076172, -4.4018030166625977e-05, 2.0563602447509766e-05, 8.514523506164551e-05, 0.00014972686767578125, 0.000214308500289917, 0.00027889013290405273, 0.0003434717655181885, 0.0004080533981323242, 0.00047263503074645996, 0.0005372166633605957, 0.0006017982959747314, 0.0006663799285888672, 0.0007309615612030029, 0.0007955431938171387, 0.0008601248264312744, 0.0009247064590454102, 0.000989288091659546, 0.0010538697242736816, 0.0011184513568878174, 0.0011830329895019531, 0.0012476146221160889, 0.0013121962547302246, 0.0013767778873443604, 0.001441359519958496, 0.0015059411525726318, 0.0015705227851867676, 0.0016351044178009033, 0.001699686050415039, 0.0017642676830291748, 0.0018288493156433105, 0.0018934309482574463, 0.001958012580871582, 0.0020225942134857178, 0.0020871758460998535, 0.0021517574787139893, 0.002216339111328125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 8.0, 4.0, 6.0, 5.0, 12.0, 13.0, 25.0, 25.0, 50.0, 78.0, 98.0, 173.0, 389.0, 810.0, 1786.0, 4790.0, 26818.0, 611316.0, 377061.0, 18164.0, 3959.0, 1464.0, 666.0, 332.0, 180.0, 93.0, 59.0, 42.0, 26.0, 16.0, 14.0, 8.0, 7.0, 5.0, 2.0, 5.0, 6.0, 6.0, 4.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.96875, -31.86669921875, -30.7646484375, -29.66259765625, -28.560546875, -27.45849609375, -26.3564453125, -25.25439453125, -24.15234375, -23.05029296875, -21.9482421875, -20.84619140625, -19.744140625, -18.64208984375, -17.5400390625, -16.43798828125, -15.3359375, -14.23388671875, -13.1318359375, -12.02978515625, -10.927734375, -9.82568359375, -8.7236328125, -7.62158203125, -6.51953125, -5.41748046875, -4.3154296875, -3.21337890625, -2.111328125, -1.00927734375, 0.0927734375, 1.19482421875, 2.296875, 3.39892578125, 4.5009765625, 5.60302734375, 6.705078125, 7.80712890625, 8.9091796875, 10.01123046875, 11.11328125, 12.21533203125, 13.3173828125, 14.41943359375, 15.521484375, 16.62353515625, 17.7255859375, 18.82763671875, 19.9296875, 21.03173828125, 22.1337890625, 23.23583984375, 24.337890625, 25.43994140625, 26.5419921875, 27.64404296875, 28.74609375, 29.84814453125, 30.9501953125, 32.05224609375, 33.154296875, 34.25634765625, 35.3583984375, 36.46044921875, 37.5625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 8.0, 7.0, 13.0, 19.0, 41.0, 47.0, 90.0, 124.0, 153.0, 157.0, 103.0, 73.0, 52.0, 41.0, 19.0, 13.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.46875, -36.29833984375, -35.1279296875, -33.95751953125, -32.787109375, -31.61669921875, -30.4462890625, -29.27587890625, -28.10546875, -26.93505859375, -25.7646484375, -24.59423828125, -23.423828125, -22.25341796875, -21.0830078125, -19.91259765625, -18.7421875, -17.57177734375, -16.4013671875, -15.23095703125, -14.060546875, -12.89013671875, -11.7197265625, -10.54931640625, -9.37890625, -8.20849609375, -7.0380859375, -5.86767578125, -4.697265625, -3.52685546875, -2.3564453125, -1.18603515625, -0.015625, 1.15478515625, 2.3251953125, 3.49560546875, 4.666015625, 5.83642578125, 7.0068359375, 8.17724609375, 9.34765625, 10.51806640625, 11.6884765625, 12.85888671875, 14.029296875, 15.19970703125, 16.3701171875, 17.54052734375, 18.7109375, 19.88134765625, 21.0517578125, 22.22216796875, 23.392578125, 24.56298828125, 25.7333984375, 26.90380859375, 28.07421875, 29.24462890625, 30.4150390625, 31.58544921875, 32.755859375, 33.92626953125, 35.0966796875, 36.26708984375, 37.4375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 16.0, 38.0, 179.0, 428.0, 264.0, 69.0, 10.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-956.5154418945312, -927.1532592773438, -897.7910766601562, -868.4288940429688, -839.0667114257812, -809.7045288085938, -780.34228515625, -750.9801025390625, -721.617919921875, -692.2557373046875, -662.8935546875, -633.5313720703125, -604.169189453125, -574.8070068359375, -545.44482421875, -516.0826416015625, -486.720458984375, -457.3582763671875, -427.99609375, -398.6339111328125, -369.271728515625, -339.9095458984375, -310.5473327636719, -281.1851501464844, -251.82296752929688, -222.46078491210938, -193.09860229492188, -163.7364044189453, -134.3742218017578, -105.01203918457031, -75.64984130859375, -46.28765869140625, -16.9254150390625, 12.436771392822266, 41.79895782470703, 71.16114807128906, 100.52333068847656, 129.88551330566406, 159.24771118164062, 188.60989379882812, 217.97207641601562, 247.33425903320312, 276.6964416503906, 306.05865478515625, 335.42083740234375, 364.78302001953125, 394.14520263671875, 423.50738525390625, 452.86956787109375, 482.23175048828125, 511.59393310546875, 540.9561157226562, 570.3182983398438, 599.6804809570312, 629.042724609375, 658.4049072265625, 687.76708984375, 717.1292724609375, 746.491455078125, 775.8536376953125, 805.2158203125, 834.5780029296875, 863.940185546875, 893.3023681640625, 922.66455078125]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 9.0, 10.0, 6.0, 9.0, 22.0, 17.0, 21.0, 20.0, 30.0, 42.0, 38.0, 42.0, 53.0, 35.0, 55.0, 54.0, 68.0, 52.0, 46.0, 50.0, 49.0, 48.0, 40.0, 23.0, 29.0, 28.0, 23.0, 23.0, 9.0, 12.0, 9.0, 7.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-109.92018127441406, -105.06048583984375, -100.20079040527344, -95.34110260009766, -90.48140716552734, -85.62171173095703, -80.76202392578125, -75.90232849121094, -71.04263305664062, -66.18293762207031, -61.323246002197266, -56.46355438232422, -51.603858947753906, -46.744163513183594, -41.88447189331055, -37.0247802734375, -32.16508483886719, -27.305391311645508, -22.445697784423828, -17.58600425720215, -12.726310729980469, -7.866617202758789, -3.0069236755371094, 1.8527679443359375, 6.71246337890625, 11.57215690612793, 16.43185043334961, 21.29154396057129, 26.15123748779297, 31.01093101501465, 35.87062454223633, 40.730316162109375, 45.59002685546875, 50.44972229003906, 55.30941390991211, 60.169105529785156, 65.02880096435547, 69.88849639892578, 74.74818420410156, 79.60787963867188, 84.46757507324219, 89.3272705078125, 94.18696594238281, 99.0466537475586, 103.9063491821289, 108.76604461669922, 113.625732421875, 118.48542785644531, 123.34512329101562, 128.20481872558594, 133.06451416015625, 137.92420959472656, 142.78390502929688, 147.64358520507812, 152.50328063964844, 157.36297607421875, 162.22267150878906, 167.08236694335938, 171.9420623779297, 176.8017578125, 181.66143798828125, 186.52113342285156, 191.38082885742188, 196.2405242919922, 201.1002197265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 8.0, 9.0, 8.0, 34.0, 41.0, 70.0, 100.0, 187.0, 317.0, 613.0, 1603.0, 6527.0, 137633.0, 4036089.0, 7708.0, 1815.0, 667.0, 349.0, 195.0, 98.0, 70.0, 40.0, 29.0, 16.0, 18.0, 3.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.3125, -96.3076171875, -93.302734375, -90.2978515625, -87.29296875, -84.2880859375, -81.283203125, -78.2783203125, -75.2734375, -72.2685546875, -69.263671875, -66.2587890625, -63.25390625, -60.2490234375, -57.244140625, -54.2392578125, -51.234375, -48.2294921875, -45.224609375, -42.2197265625, -39.21484375, -36.2099609375, -33.205078125, -30.2001953125, -27.1953125, -24.1904296875, -21.185546875, -18.1806640625, -15.17578125, -12.1708984375, -9.166015625, -6.1611328125, -3.15625, -0.1513671875, 2.853515625, 5.8583984375, 8.86328125, 11.8681640625, 14.873046875, 17.8779296875, 20.8828125, 23.8876953125, 26.892578125, 29.8974609375, 32.90234375, 35.9072265625, 38.912109375, 41.9169921875, 44.921875, 47.9267578125, 50.931640625, 53.9365234375, 56.94140625, 59.9462890625, 62.951171875, 65.9560546875, 68.9609375, 71.9658203125, 74.970703125, 77.9755859375, 80.98046875, 83.9853515625, 86.990234375, 89.9951171875, 93.0]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 10.0, 6.0, 15.0, 19.0, 20.0, 39.0, 33.0, 36.0, 42.0, 64.0, 59.0, 65.0, 59.0, 66.0, 65.0, 79.0, 60.0, 54.0, 46.0, 36.0, 35.0, 17.0, 20.0, 14.0, 7.0, 9.0, 8.0, 1.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.91015625, -7.686279296875, -7.46240234375, -7.238525390625, -7.0146484375, -6.790771484375, -6.56689453125, -6.343017578125, -6.119140625, -5.895263671875, -5.67138671875, -5.447509765625, -5.2236328125, -4.999755859375, -4.77587890625, -4.552001953125, -4.328125, -4.104248046875, -3.88037109375, -3.656494140625, -3.4326171875, -3.208740234375, -2.98486328125, -2.760986328125, -2.537109375, -2.313232421875, -2.08935546875, -1.865478515625, -1.6416015625, -1.417724609375, -1.19384765625, -0.969970703125, -0.74609375, -0.522216796875, -0.29833984375, -0.074462890625, 0.1494140625, 0.373291015625, 0.59716796875, 0.821044921875, 1.044921875, 1.268798828125, 1.49267578125, 1.716552734375, 1.9404296875, 2.164306640625, 2.38818359375, 2.612060546875, 2.8359375, 3.059814453125, 3.28369140625, 3.507568359375, 3.7314453125, 3.955322265625, 4.17919921875, 4.403076171875, 4.626953125, 4.850830078125, 5.07470703125, 5.298583984375, 5.5224609375, 5.746337890625, 5.97021484375, 6.194091796875, 6.41796875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 7.0, 16.0, 24.0, 18.0, 40.0, 52.0, 73.0, 72.0, 128.0, 154.0, 225.0, 308.0, 377.0, 605.0, 895.0, 1508.0, 2457.0, 4793.0, 11292.0, 35380.0, 3891736.0, 197795.0, 26532.0, 9402.0, 4077.0, 2113.0, 1356.0, 848.0, 542.0, 390.0, 276.0, 228.0, 124.0, 112.0, 79.0, 62.0, 38.0, 33.0, 32.0, 14.0, 22.0, 12.0, 8.0, 1.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-37.96875, -36.7783203125, -35.587890625, -34.3974609375, -33.20703125, -32.0166015625, -30.826171875, -29.6357421875, -28.4453125, -27.2548828125, -26.064453125, -24.8740234375, -23.68359375, -22.4931640625, -21.302734375, -20.1123046875, -18.921875, -17.7314453125, -16.541015625, -15.3505859375, -14.16015625, -12.9697265625, -11.779296875, -10.5888671875, -9.3984375, -8.2080078125, -7.017578125, -5.8271484375, -4.63671875, -3.4462890625, -2.255859375, -1.0654296875, 0.125, 1.3154296875, 2.505859375, 3.6962890625, 4.88671875, 6.0771484375, 7.267578125, 8.4580078125, 9.6484375, 10.8388671875, 12.029296875, 13.2197265625, 14.41015625, 15.6005859375, 16.791015625, 17.9814453125, 19.171875, 20.3623046875, 21.552734375, 22.7431640625, 23.93359375, 25.1240234375, 26.314453125, 27.5048828125, 28.6953125, 29.8857421875, 31.076171875, 32.2666015625, 33.45703125, 34.6474609375, 35.837890625, 37.0283203125, 38.21875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 5.0, 11.0, 12.0, 22.0, 31.0, 61.0, 234.0, 3519.0, 66.0, 24.0, 21.0, 17.0, 13.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.09375, -10.7686767578125, -10.443603515625, -10.1185302734375, -9.79345703125, -9.4683837890625, -9.143310546875, -8.8182373046875, -8.4931640625, -8.1680908203125, -7.843017578125, -7.5179443359375, -7.19287109375, -6.8677978515625, -6.542724609375, -6.2176513671875, -5.892578125, -5.5675048828125, -5.242431640625, -4.9173583984375, -4.59228515625, -4.2672119140625, -3.942138671875, -3.6170654296875, -3.2919921875, -2.9669189453125, -2.641845703125, -2.3167724609375, -1.99169921875, -1.6666259765625, -1.341552734375, -1.0164794921875, -0.69140625, -0.3663330078125, -0.041259765625, 0.2838134765625, 0.60888671875, 0.9339599609375, 1.259033203125, 1.5841064453125, 1.9091796875, 2.2342529296875, 2.559326171875, 2.8843994140625, 3.20947265625, 3.5345458984375, 3.859619140625, 4.1846923828125, 4.509765625, 4.8348388671875, 5.159912109375, 5.4849853515625, 5.81005859375, 6.1351318359375, 6.460205078125, 6.7852783203125, 7.1103515625, 7.4354248046875, 7.760498046875, 8.0855712890625, 8.41064453125, 8.7357177734375, 9.060791015625, 9.3858642578125, 9.7109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 3.0, 9.0, 8.0, 17.0, 20.0, 34.0, 62.0, 83.0, 114.0, 115.0, 114.0, 100.0, 99.0, 67.0, 54.0, 39.0, 18.0, 12.0, 9.0, 4.0, 2.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.999881744384766, -36.984230041503906, -35.96858215332031, -34.95293426513672, -33.93728256225586, -32.921630859375, -31.905982971191406, -30.89033317565918, -29.874683380126953, -28.859033584594727, -27.8433837890625, -26.827733993530273, -25.812084197998047, -24.79643440246582, -23.780784606933594, -22.765134811401367, -21.74948501586914, -20.733835220336914, -19.718185424804688, -18.70253562927246, -17.686885833740234, -16.671236038208008, -15.655586242675781, -14.639936447143555, -13.624286651611328, -12.608636856079102, -11.592987060546875, -10.577337265014648, -9.561687469482422, -8.546037673950195, -7.530387878417969, -6.514738082885742, -5.49908447265625, -4.483434677124023, -3.467784881591797, -2.4521350860595703, -1.4364852905273438, -0.4208354949951172, 0.5948143005371094, 1.610464096069336, 2.6261138916015625, 3.641763687133789, 4.657413482666016, 5.673063278198242, 6.688713073730469, 7.704362869262695, 8.720012664794922, 9.735662460327148, 10.751312255859375, 11.766962051391602, 12.782611846923828, 13.798261642456055, 14.813911437988281, 15.829561233520508, 16.845211029052734, 17.86086082458496, 18.876510620117188, 19.892160415649414, 20.90781021118164, 21.923460006713867, 22.939109802246094, 23.95475959777832, 24.970409393310547, 25.986059188842773, 27.001708984375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 15.0, 16.0, 20.0, 21.0, 28.0, 31.0, 39.0, 43.0, 52.0, 64.0, 54.0, 64.0, 58.0, 60.0, 62.0, 49.0, 52.0, 50.0, 56.0, 31.0, 31.0, 23.0, 19.0, 17.0, 14.0, 11.0, 7.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.184345245361328, -17.447647094726562, -16.710947036743164, -15.974248886108398, -15.237549781799316, -14.500850677490234, -13.764152526855469, -13.027453422546387, -12.290754318237305, -11.554055213928223, -10.81735610961914, -10.080657958984375, -9.343958854675293, -8.607259750366211, -7.870561122894287, -7.133862495422363, -6.397163391113281, -5.660464286804199, -4.923765659332275, -4.187067031860352, -3.4503679275512695, -2.7136690616607666, -1.9769701957702637, -1.2402715682983398, -0.5035724639892578, 0.23312640190124512, 0.969825267791748, 1.706524133682251, 2.443222999572754, 3.179921865463257, 3.9166207313537598, 4.653319358825684, 5.390018463134766, 6.126717567443848, 6.8634161949157715, 7.600114822387695, 8.336813926696777, 9.07351303100586, 9.810211181640625, 10.546910285949707, 11.283609390258789, 12.020308494567871, 12.757007598876953, 13.493705749511719, 14.2304048538208, 14.967103958129883, 15.703802108764648, 16.440502166748047, 17.177200317382812, 17.913898468017578, 18.650598526000977, 19.387296676635742, 20.12399673461914, 20.860694885253906, 21.597393035888672, 22.334091186523438, 23.070791244506836, 23.8074893951416, 24.544189453125, 25.280887603759766, 26.01758575439453, 26.75428581237793, 27.490983963012695, 28.227684020996094, 28.96438217163086]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 10.0, 14.0, 16.0, 19.0, 40.0, 46.0, 74.0, 130.0, 185.0, 295.0, 481.0, 796.0, 1423.0, 2720.0, 5479.0, 11318.0, 24546.0, 55808.0, 127239.0, 242969.0, 274742.0, 163542.0, 74662.0, 32829.0, 14613.0, 6844.0, 3466.0, 1772.0, 983.0, 553.0, 335.0, 211.0, 130.0, 83.0, 60.0, 32.0, 34.0, 15.0, 12.0, 13.0, 3.0, 3.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.859375, -23.1611328125, -22.462890625, -21.7646484375, -21.06640625, -20.3681640625, -19.669921875, -18.9716796875, -18.2734375, -17.5751953125, -16.876953125, -16.1787109375, -15.48046875, -14.7822265625, -14.083984375, -13.3857421875, -12.6875, -11.9892578125, -11.291015625, -10.5927734375, -9.89453125, -9.1962890625, -8.498046875, -7.7998046875, -7.1015625, -6.4033203125, -5.705078125, -5.0068359375, -4.30859375, -3.6103515625, -2.912109375, -2.2138671875, -1.515625, -0.8173828125, -0.119140625, 0.5791015625, 1.27734375, 1.9755859375, 2.673828125, 3.3720703125, 4.0703125, 4.7685546875, 5.466796875, 6.1650390625, 6.86328125, 7.5615234375, 8.259765625, 8.9580078125, 9.65625, 10.3544921875, 11.052734375, 11.7509765625, 12.44921875, 13.1474609375, 13.845703125, 14.5439453125, 15.2421875, 15.9404296875, 16.638671875, 17.3369140625, 18.03515625, 18.7333984375, 19.431640625, 20.1298828125, 20.828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 12.0, 15.0, 11.0, 22.0, 30.0, 29.0, 28.0, 36.0, 51.0, 55.0, 46.0, 54.0, 53.0, 54.0, 71.0, 56.0, 60.0, 53.0, 56.0, 36.0, 39.0, 32.0, 17.0, 19.0, 13.0, 13.0, 8.0, 4.0, 4.0, 5.0, 2.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.390625, -8.15557861328125, -7.9205322265625, -7.68548583984375, -7.450439453125, -7.21539306640625, -6.9803466796875, -6.74530029296875, -6.51025390625, -6.27520751953125, -6.0401611328125, -5.80511474609375, -5.570068359375, -5.33502197265625, -5.0999755859375, -4.86492919921875, -4.6298828125, -4.39483642578125, -4.1597900390625, -3.92474365234375, -3.689697265625, -3.45465087890625, -3.2196044921875, -2.98455810546875, -2.74951171875, -2.51446533203125, -2.2794189453125, -2.04437255859375, -1.809326171875, -1.57427978515625, -1.3392333984375, -1.10418701171875, -0.869140625, -0.63409423828125, -0.3990478515625, -0.16400146484375, 0.071044921875, 0.30609130859375, 0.5411376953125, 0.77618408203125, 1.01123046875, 1.24627685546875, 1.4813232421875, 1.71636962890625, 1.951416015625, 2.18646240234375, 2.4215087890625, 2.65655517578125, 2.8916015625, 3.12664794921875, 3.3616943359375, 3.59674072265625, 3.831787109375, 4.06683349609375, 4.3018798828125, 4.53692626953125, 4.77197265625, 5.00701904296875, 5.2420654296875, 5.47711181640625, 5.712158203125, 5.94720458984375, 6.1822509765625, 6.41729736328125, 6.65234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 4.0, 5.0, 7.0, 10.0, 8.0, 9.0, 10.0, 29.0, 41.0, 64.0, 85.0, 149.0, 236.0, 398.0, 776.0, 1910.0, 7326.0, 45833.0, 411683.0, 508316.0, 58674.0, 8873.0, 2204.0, 804.0, 436.0, 237.0, 160.0, 69.0, 61.0, 31.0, 25.0, 14.0, 19.0, 9.0, 6.0, 9.0, 5.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.25, -52.31640625, -50.3828125, -48.44921875, -46.515625, -44.58203125, -42.6484375, -40.71484375, -38.78125, -36.84765625, -34.9140625, -32.98046875, -31.046875, -29.11328125, -27.1796875, -25.24609375, -23.3125, -21.37890625, -19.4453125, -17.51171875, -15.578125, -13.64453125, -11.7109375, -9.77734375, -7.84375, -5.91015625, -3.9765625, -2.04296875, -0.109375, 1.82421875, 3.7578125, 5.69140625, 7.625, 9.55859375, 11.4921875, 13.42578125, 15.359375, 17.29296875, 19.2265625, 21.16015625, 23.09375, 25.02734375, 26.9609375, 28.89453125, 30.828125, 32.76171875, 34.6953125, 36.62890625, 38.5625, 40.49609375, 42.4296875, 44.36328125, 46.296875, 48.23046875, 50.1640625, 52.09765625, 54.03125, 55.96484375, 57.8984375, 59.83203125, 61.765625, 63.69921875, 65.6328125, 67.56640625, 69.5]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 6.0, 9.0, 7.0, 8.0, 7.0, 16.0, 16.0, 18.0, 18.0, 25.0, 22.0, 44.0, 41.0, 31.0, 28.0, 66.0, 36.0, 40.0, 55.0, 51.0, 39.0, 35.0, 46.0, 43.0, 28.0, 24.0, 30.0, 28.0, 25.0, 27.0, 24.0, 15.0, 16.0, 15.0, 4.0, 6.0, 9.0, 9.0, 3.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.59375, -32.5888671875, -31.583984375, -30.5791015625, -29.57421875, -28.5693359375, -27.564453125, -26.5595703125, -25.5546875, -24.5498046875, -23.544921875, -22.5400390625, -21.53515625, -20.5302734375, -19.525390625, -18.5205078125, -17.515625, -16.5107421875, -15.505859375, -14.5009765625, -13.49609375, -12.4912109375, -11.486328125, -10.4814453125, -9.4765625, -8.4716796875, -7.466796875, -6.4619140625, -5.45703125, -4.4521484375, -3.447265625, -2.4423828125, -1.4375, -0.4326171875, 0.572265625, 1.5771484375, 2.58203125, 3.5869140625, 4.591796875, 5.5966796875, 6.6015625, 7.6064453125, 8.611328125, 9.6162109375, 10.62109375, 11.6259765625, 12.630859375, 13.6357421875, 14.640625, 15.6455078125, 16.650390625, 17.6552734375, 18.66015625, 19.6650390625, 20.669921875, 21.6748046875, 22.6796875, 23.6845703125, 24.689453125, 25.6943359375, 26.69921875, 27.7041015625, 28.708984375, 29.7138671875, 30.71875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 20.0, 17.0, 29.0, 38.0, 40.0, 65.0, 103.0, 143.0, 226.0, 333.0, 550.0, 976.0, 1771.0, 3527.0, 8018.0, 22748.0, 83805.0, 387385.0, 410315.0, 88307.0, 23601.0, 8370.0, 3573.0, 1857.0, 1021.0, 614.0, 347.0, 241.0, 141.0, 106.0, 64.0, 51.0, 37.0, 22.0, 27.0, 11.0, 6.0, 8.0, 2.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-19.234375, -18.6689453125, -18.103515625, -17.5380859375, -16.97265625, -16.4072265625, -15.841796875, -15.2763671875, -14.7109375, -14.1455078125, -13.580078125, -13.0146484375, -12.44921875, -11.8837890625, -11.318359375, -10.7529296875, -10.1875, -9.6220703125, -9.056640625, -8.4912109375, -7.92578125, -7.3603515625, -6.794921875, -6.2294921875, -5.6640625, -5.0986328125, -4.533203125, -3.9677734375, -3.40234375, -2.8369140625, -2.271484375, -1.7060546875, -1.140625, -0.5751953125, -0.009765625, 0.5556640625, 1.12109375, 1.6865234375, 2.251953125, 2.8173828125, 3.3828125, 3.9482421875, 4.513671875, 5.0791015625, 5.64453125, 6.2099609375, 6.775390625, 7.3408203125, 7.90625, 8.4716796875, 9.037109375, 9.6025390625, 10.16796875, 10.7333984375, 11.298828125, 11.8642578125, 12.4296875, 12.9951171875, 13.560546875, 14.1259765625, 14.69140625, 15.2568359375, 15.822265625, 16.3876953125, 16.953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 6.0, 8.0, 11.0, 21.0, 46.0, 68.0, 183.0, 217.0, 202.0, 122.0, 55.0, 32.0, 18.0, 11.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00518035888671875, -0.00496220588684082, -0.004744052886962891, -0.004525899887084961, -0.004307746887207031, -0.0040895938873291016, -0.003871440887451172, -0.003653287887573242, -0.0034351348876953125, -0.003216981887817383, -0.002998828887939453, -0.0027806758880615234, -0.0025625228881835938, -0.002344369888305664, -0.0021262168884277344, -0.0019080638885498047, -0.001689910888671875, -0.0014717578887939453, -0.0012536048889160156, -0.001035451889038086, -0.0008172988891601562, -0.0005991458892822266, -0.0003809928894042969, -0.0001628398895263672, 5.53131103515625e-05, 0.0002734661102294922, 0.0004916191101074219, 0.0007097721099853516, 0.0009279251098632812, 0.001146078109741211, 0.0013642311096191406, 0.0015823841094970703, 0.001800537109375, 0.0020186901092529297, 0.0022368431091308594, 0.002454996109008789, 0.0026731491088867188, 0.0028913021087646484, 0.003109455108642578, 0.003327608108520508, 0.0035457611083984375, 0.003763914108276367, 0.003982067108154297, 0.0042002201080322266, 0.004418373107910156, 0.004636526107788086, 0.004854679107666016, 0.005072832107543945, 0.005290985107421875, 0.005509138107299805, 0.005727291107177734, 0.005945444107055664, 0.006163597106933594, 0.0063817501068115234, 0.006599903106689453, 0.006818056106567383, 0.0070362091064453125, 0.007254362106323242, 0.007472515106201172, 0.0076906681060791016, 0.007908821105957031, 0.008126974105834961, 0.00834512710571289, 0.00856328010559082, 0.00878143310546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 3.0, 8.0, 7.0, 14.0, 19.0, 25.0, 35.0, 68.0, 104.0, 151.0, 250.0, 466.0, 1038.0, 3514.0, 22887.0, 368880.0, 606128.0, 37632.0, 4666.0, 1332.0, 545.0, 312.0, 167.0, 91.0, 78.0, 52.0, 30.0, 17.0, 14.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.078125, -29.078857421875, -28.07958984375, -27.080322265625, -26.0810546875, -25.081787109375, -24.08251953125, -23.083251953125, -22.083984375, -21.084716796875, -20.08544921875, -19.086181640625, -18.0869140625, -17.087646484375, -16.08837890625, -15.089111328125, -14.08984375, -13.090576171875, -12.09130859375, -11.092041015625, -10.0927734375, -9.093505859375, -8.09423828125, -7.094970703125, -6.095703125, -5.096435546875, -4.09716796875, -3.097900390625, -2.0986328125, -1.099365234375, -0.10009765625, 0.899169921875, 1.8984375, 2.897705078125, 3.89697265625, 4.896240234375, 5.8955078125, 6.894775390625, 7.89404296875, 8.893310546875, 9.892578125, 10.891845703125, 11.89111328125, 12.890380859375, 13.8896484375, 14.888916015625, 15.88818359375, 16.887451171875, 17.88671875, 18.885986328125, 19.88525390625, 20.884521484375, 21.8837890625, 22.883056640625, 23.88232421875, 24.881591796875, 25.880859375, 26.880126953125, 27.87939453125, 28.878662109375, 29.8779296875, 30.877197265625, 31.87646484375, 32.875732421875, 33.875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 13.0, 4.0, 12.0, 13.0, 13.0, 23.0, 16.0, 28.0, 43.0, 38.0, 42.0, 60.0, 75.0, 72.0, 85.0, 95.0, 69.0, 51.0, 54.0, 36.0, 31.0, 25.0, 24.0, 15.0, 16.0, 16.0, 10.0, 10.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.9375, -17.228759765625, -16.52001953125, -15.811279296875, -15.1025390625, -14.393798828125, -13.68505859375, -12.976318359375, -12.267578125, -11.558837890625, -10.85009765625, -10.141357421875, -9.4326171875, -8.723876953125, -8.01513671875, -7.306396484375, -6.59765625, -5.888916015625, -5.18017578125, -4.471435546875, -3.7626953125, -3.053955078125, -2.34521484375, -1.636474609375, -0.927734375, -0.218994140625, 0.48974609375, 1.198486328125, 1.9072265625, 2.615966796875, 3.32470703125, 4.033447265625, 4.7421875, 5.450927734375, 6.15966796875, 6.868408203125, 7.5771484375, 8.285888671875, 8.99462890625, 9.703369140625, 10.412109375, 11.120849609375, 11.82958984375, 12.538330078125, 13.2470703125, 13.955810546875, 14.66455078125, 15.373291015625, 16.08203125, 16.790771484375, 17.49951171875, 18.208251953125, 18.9169921875, 19.625732421875, 20.33447265625, 21.043212890625, 21.751953125, 22.460693359375, 23.16943359375, 23.878173828125, 24.5869140625, 25.295654296875, 26.00439453125, 26.713134765625, 27.421875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 10.0, 17.0, 48.0, 84.0, 163.0, 203.0, 188.0, 132.0, 81.0, 44.0, 21.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-413.8857421875, -398.4674072265625, -383.049072265625, -367.6307067871094, -352.2123718261719, -336.7940368652344, -321.37567138671875, -305.95733642578125, -290.53900146484375, -275.12066650390625, -259.70233154296875, -244.28396606445312, -228.86563110351562, -213.44729614257812, -198.02894592285156, -182.610595703125, -167.1922607421875, -151.77392578125, -136.35557556152344, -120.9372329711914, -105.51889038085938, -90.10054779052734, -74.68220520019531, -59.26386260986328, -43.84552001953125, -28.42717742919922, -13.008834838867188, 2.4095077514648438, 17.827850341796875, 33.246192932128906, 48.66453552246094, 64.08287811279297, 79.501220703125, 94.91956329345703, 110.33790588378906, 125.7562484741211, 141.17459106445312, 156.59292602539062, 172.0112762451172, 187.42962646484375, 202.84796142578125, 218.26629638671875, 233.6846466064453, 249.10299682617188, 264.5213317871094, 279.9396667480469, 295.3580322265625, 310.7763671875, 326.1947021484375, 341.613037109375, 357.0313720703125, 372.4497375488281, 387.8680725097656, 403.2864074707031, 418.70477294921875, 434.12310791015625, 449.54144287109375, 464.95977783203125, 480.37811279296875, 495.7964782714844, 511.2148132324219, 526.6331787109375, 542.051513671875, 557.4698486328125, 572.88818359375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 10.0, 7.0, 8.0, 10.0, 9.0, 15.0, 20.0, 22.0, 32.0, 20.0, 28.0, 35.0, 25.0, 25.0, 36.0, 35.0, 42.0, 49.0, 53.0, 41.0, 45.0, 45.0, 34.0, 36.0, 40.0, 38.0, 31.0, 25.0, 23.0, 21.0, 26.0, 18.0, 20.0, 17.0, 14.0, 8.0, 7.0, 6.0, 5.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-164.18109130859375, -158.99493408203125, -153.80877685546875, -148.62261962890625, -143.43646240234375, -138.2503204345703, -133.0641632080078, -127.87800598144531, -122.69184875488281, -117.50569152832031, -112.31953430175781, -107.13338470458984, -101.94722747802734, -96.76107025146484, -91.57492065429688, -86.38876342773438, -81.20260620117188, -76.01644897460938, -70.83029174804688, -65.6441421508789, -60.457984924316406, -55.271827697753906, -50.08567428588867, -44.89952087402344, -39.71336364746094, -34.52720642089844, -29.341053009033203, -24.154897689819336, -18.96874237060547, -13.782587051391602, -8.596431732177734, -3.4102783203125, 1.7758636474609375, 6.962018966674805, 12.148174285888672, 17.33432960510254, 22.520484924316406, 27.706640243530273, 32.89279556274414, 38.078948974609375, 43.265106201171875, 48.451263427734375, 53.63741683959961, 58.823570251464844, 64.00972747802734, 69.19588470458984, 74.38203430175781, 79.56819152832031, 84.75434875488281, 89.94050598144531, 95.12666320800781, 100.31281280517578, 105.49897003173828, 110.68512725830078, 115.87127685546875, 121.05743408203125, 126.24359130859375, 131.42974853515625, 136.61590576171875, 141.80206298828125, 146.98822021484375, 152.1743621826172, 157.3605194091797, 162.5466766357422, 167.7328338623047]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 2.0, 5.0, 11.0, 35.0, 28.0, 55.0, 67.0, 109.0, 208.0, 528.0, 1605.0, 8685.0, 4060217.0, 114793.0, 5822.0, 1212.0, 447.0, 197.0, 81.0, 62.0, 25.0, 18.0, 23.0, 14.0, 4.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.8125, -84.548828125, -81.28515625, -78.021484375, -74.7578125, -71.494140625, -68.23046875, -64.966796875, -61.703125, -58.439453125, -55.17578125, -51.912109375, -48.6484375, -45.384765625, -42.12109375, -38.857421875, -35.59375, -32.330078125, -29.06640625, -25.802734375, -22.5390625, -19.275390625, -16.01171875, -12.748046875, -9.484375, -6.220703125, -2.95703125, 0.306640625, 3.5703125, 6.833984375, 10.09765625, 13.361328125, 16.625, 19.888671875, 23.15234375, 26.416015625, 29.6796875, 32.943359375, 36.20703125, 39.470703125, 42.734375, 45.998046875, 49.26171875, 52.525390625, 55.7890625, 59.052734375, 62.31640625, 65.580078125, 68.84375, 72.107421875, 75.37109375, 78.634765625, 81.8984375, 85.162109375, 88.42578125, 91.689453125, 94.953125, 98.216796875, 101.48046875, 104.744140625, 108.0078125, 111.271484375, 114.53515625, 117.798828125, 121.0625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 3.0, 4.0, 3.0, 13.0, 12.0, 15.0, 24.0, 30.0, 26.0, 46.0, 57.0, 54.0, 64.0, 72.0, 58.0, 62.0, 83.0, 64.0, 62.0, 51.0, 50.0, 20.0, 31.0, 25.0, 15.0, 13.0, 9.0, 9.0, 9.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4453125, -10.149169921875, -9.85302734375, -9.556884765625, -9.2607421875, -8.964599609375, -8.66845703125, -8.372314453125, -8.076171875, -7.780029296875, -7.48388671875, -7.187744140625, -6.8916015625, -6.595458984375, -6.29931640625, -6.003173828125, -5.70703125, -5.410888671875, -5.11474609375, -4.818603515625, -4.5224609375, -4.226318359375, -3.93017578125, -3.634033203125, -3.337890625, -3.041748046875, -2.74560546875, -2.449462890625, -2.1533203125, -1.857177734375, -1.56103515625, -1.264892578125, -0.96875, -0.672607421875, -0.37646484375, -0.080322265625, 0.2158203125, 0.511962890625, 0.80810546875, 1.104248046875, 1.400390625, 1.696533203125, 1.99267578125, 2.288818359375, 2.5849609375, 2.881103515625, 3.17724609375, 3.473388671875, 3.76953125, 4.065673828125, 4.36181640625, 4.657958984375, 4.9541015625, 5.250244140625, 5.54638671875, 5.842529296875, 6.138671875, 6.434814453125, 6.73095703125, 7.027099609375, 7.3232421875, 7.619384765625, 7.91552734375, 8.211669921875, 8.5078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 6.0, 5.0, 11.0, 12.0, 16.0, 21.0, 32.0, 53.0, 77.0, 139.0, 199.0, 351.0, 590.0, 1159.0, 2158.0, 4587.0, 10955.0, 30141.0, 176504.0, 3889963.0, 49423.0, 15257.0, 6289.0, 3021.0, 1460.0, 769.0, 414.0, 256.0, 147.0, 85.0, 50.0, 48.0, 14.0, 23.0, 12.0, 14.0, 11.0, 2.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.9375, -42.65234375, -41.3671875, -40.08203125, -38.796875, -37.51171875, -36.2265625, -34.94140625, -33.65625, -32.37109375, -31.0859375, -29.80078125, -28.515625, -27.23046875, -25.9453125, -24.66015625, -23.375, -22.08984375, -20.8046875, -19.51953125, -18.234375, -16.94921875, -15.6640625, -14.37890625, -13.09375, -11.80859375, -10.5234375, -9.23828125, -7.953125, -6.66796875, -5.3828125, -4.09765625, -2.8125, -1.52734375, -0.2421875, 1.04296875, 2.328125, 3.61328125, 4.8984375, 6.18359375, 7.46875, 8.75390625, 10.0390625, 11.32421875, 12.609375, 13.89453125, 15.1796875, 16.46484375, 17.75, 19.03515625, 20.3203125, 21.60546875, 22.890625, 24.17578125, 25.4609375, 26.74609375, 28.03125, 29.31640625, 30.6015625, 31.88671875, 33.171875, 34.45703125, 35.7421875, 37.02734375, 38.3125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 6.0, 8.0, 16.0, 9.0, 18.0, 21.0, 24.0, 46.0, 76.0, 282.0, 3305.0, 87.0, 51.0, 19.0, 18.0, 20.0, 9.0, 11.0, 13.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.765625, -9.461669921875, -9.15771484375, -8.853759765625, -8.5498046875, -8.245849609375, -7.94189453125, -7.637939453125, -7.333984375, -7.030029296875, -6.72607421875, -6.422119140625, -6.1181640625, -5.814208984375, -5.51025390625, -5.206298828125, -4.90234375, -4.598388671875, -4.29443359375, -3.990478515625, -3.6865234375, -3.382568359375, -3.07861328125, -2.774658203125, -2.470703125, -2.166748046875, -1.86279296875, -1.558837890625, -1.2548828125, -0.950927734375, -0.64697265625, -0.343017578125, -0.0390625, 0.264892578125, 0.56884765625, 0.872802734375, 1.1767578125, 1.480712890625, 1.78466796875, 2.088623046875, 2.392578125, 2.696533203125, 3.00048828125, 3.304443359375, 3.6083984375, 3.912353515625, 4.21630859375, 4.520263671875, 4.82421875, 5.128173828125, 5.43212890625, 5.736083984375, 6.0400390625, 6.343994140625, 6.64794921875, 6.951904296875, 7.255859375, 7.559814453125, 7.86376953125, 8.167724609375, 8.4716796875, 8.775634765625, 9.07958984375, 9.383544921875, 9.6875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 10.0, 12.0, 26.0, 46.0, 86.0, 110.0, 159.0, 156.0, 143.0, 89.0, 60.0, 48.0, 23.0, 11.0, 11.0, 6.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.36907958984375, -50.744483947753906, -49.11988830566406, -47.49529266357422, -45.87069320678711, -44.246097564697266, -42.62150192260742, -40.99690628051758, -39.37230682373047, -37.747711181640625, -36.12311553955078, -34.49851989746094, -32.87392044067383, -31.249324798583984, -29.62472915649414, -28.000133514404297, -26.375537872314453, -24.75094223022461, -23.126344680786133, -21.50174903869629, -19.877151489257812, -18.25255584716797, -16.627960205078125, -15.003363609313965, -13.378767013549805, -11.754170417785645, -10.129573822021484, -8.50497817993164, -6.8803815841674805, -5.25578498840332, -3.6311893463134766, -2.0065927505493164, -0.38199615478515625, 1.2426002025604248, 2.867196559906006, 4.491792678833008, 6.116389274597168, 7.740985870361328, 9.365581512451172, 10.990178108215332, 12.614774703979492, 14.239371299743652, 15.863967895507812, 17.488563537597656, 19.1131591796875, 20.737756729125977, 22.36235237121582, 23.986949920654297, 25.61154556274414, 27.236141204833984, 28.86073875427246, 30.485334396362305, 32.10993194580078, 33.734527587890625, 35.35912322998047, 36.98371887207031, 38.608314514160156, 40.23291015625, 41.857505798339844, 43.48210144042969, 45.1067008972168, 46.73129653930664, 48.355892181396484, 49.98048782348633, 51.60508728027344]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 6.0, 12.0, 10.0, 12.0, 11.0, 23.0, 12.0, 24.0, 28.0, 30.0, 29.0, 34.0, 40.0, 30.0, 39.0, 33.0, 38.0, 40.0, 53.0, 43.0, 42.0, 42.0, 49.0, 27.0, 38.0, 35.0, 34.0, 26.0, 19.0, 23.0, 16.0, 18.0, 11.0, 12.0, 8.0, 12.0, 4.0, 13.0, 3.0, 7.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.52053451538086, -20.859607696533203, -20.198678970336914, -19.537752151489258, -18.87682342529297, -18.215896606445312, -17.554969787597656, -16.894041061401367, -16.23311424255371, -15.572186470031738, -14.911258697509766, -14.25033187866211, -13.589404106140137, -12.928476333618164, -12.267548561096191, -11.606620788574219, -10.945693016052246, -10.284765243530273, -9.6238374710083, -8.962909698486328, -8.301982879638672, -7.641055107116699, -6.980127334594727, -6.319200038909912, -5.6582722663879395, -4.997344493865967, -4.336417198181152, -3.6754894256591797, -3.014561891555786, -2.3536343574523926, -1.69270658493042, -1.0317792892456055, -0.3708515167236328, 0.2900760769844055, 0.9510036706924438, 1.611931324005127, 2.2728588581085205, 2.933786392211914, 3.5947141647338867, 4.255641460418701, 4.916569232940674, 5.5774970054626465, 6.238424301147461, 6.899352073669434, 7.560279846191406, 8.221206665039062, 8.882135391235352, 9.543062210083008, 10.20398998260498, 10.864917755126953, 11.525845527648926, 12.186773300170898, 12.847700119018555, 13.508627891540527, 14.1695556640625, 14.830482482910156, 15.491411209106445, 16.1523380279541, 16.81326675415039, 17.474193572998047, 18.135122299194336, 18.796049118041992, 19.45697784423828, 20.117904663085938, 20.778831481933594]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 7.0, 13.0, 17.0, 21.0, 38.0, 57.0, 103.0, 111.0, 186.0, 301.0, 514.0, 747.0, 1267.0, 2243.0, 4386.0, 8134.0, 16733.0, 36581.0, 81150.0, 176114.0, 282595.0, 226703.0, 113401.0, 50689.0, 23076.0, 10825.0, 5474.0, 2875.0, 1614.0, 929.0, 573.0, 365.0, 255.0, 142.0, 93.0, 53.0, 58.0, 26.0, 19.0, 11.0, 17.0, 13.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.78125, -21.135009765625, -20.48876953125, -19.842529296875, -19.1962890625, -18.550048828125, -17.90380859375, -17.257568359375, -16.611328125, -15.965087890625, -15.31884765625, -14.672607421875, -14.0263671875, -13.380126953125, -12.73388671875, -12.087646484375, -11.44140625, -10.795166015625, -10.14892578125, -9.502685546875, -8.8564453125, -8.210205078125, -7.56396484375, -6.917724609375, -6.271484375, -5.625244140625, -4.97900390625, -4.332763671875, -3.6865234375, -3.040283203125, -2.39404296875, -1.747802734375, -1.1015625, -0.455322265625, 0.19091796875, 0.837158203125, 1.4833984375, 2.129638671875, 2.77587890625, 3.422119140625, 4.068359375, 4.714599609375, 5.36083984375, 6.007080078125, 6.6533203125, 7.299560546875, 7.94580078125, 8.592041015625, 9.23828125, 9.884521484375, 10.53076171875, 11.177001953125, 11.8232421875, 12.469482421875, 13.11572265625, 13.761962890625, 14.408203125, 15.054443359375, 15.70068359375, 16.346923828125, 16.9931640625, 17.639404296875, 18.28564453125, 18.931884765625, 19.578125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 9.0, 9.0, 16.0, 10.0, 11.0, 25.0, 25.0, 23.0, 31.0, 51.0, 47.0, 42.0, 58.0, 58.0, 50.0, 72.0, 58.0, 59.0, 66.0, 49.0, 43.0, 35.0, 29.0, 23.0, 31.0, 17.0, 9.0, 11.0, 12.0, 1.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-10.84375, -10.544921875, -10.24609375, -9.947265625, -9.6484375, -9.349609375, -9.05078125, -8.751953125, -8.453125, -8.154296875, -7.85546875, -7.556640625, -7.2578125, -6.958984375, -6.66015625, -6.361328125, -6.0625, -5.763671875, -5.46484375, -5.166015625, -4.8671875, -4.568359375, -4.26953125, -3.970703125, -3.671875, -3.373046875, -3.07421875, -2.775390625, -2.4765625, -2.177734375, -1.87890625, -1.580078125, -1.28125, -0.982421875, -0.68359375, -0.384765625, -0.0859375, 0.212890625, 0.51171875, 0.810546875, 1.109375, 1.408203125, 1.70703125, 2.005859375, 2.3046875, 2.603515625, 2.90234375, 3.201171875, 3.5, 3.798828125, 4.09765625, 4.396484375, 4.6953125, 4.994140625, 5.29296875, 5.591796875, 5.890625, 6.189453125, 6.48828125, 6.787109375, 7.0859375, 7.384765625, 7.68359375, 7.982421875, 8.28125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 8.0, 7.0, 17.0, 20.0, 21.0, 30.0, 42.0, 56.0, 72.0, 131.0, 218.0, 360.0, 578.0, 1119.0, 2739.0, 10120.0, 69980.0, 637419.0, 287497.0, 28647.0, 5594.0, 1747.0, 858.0, 461.0, 259.0, 161.0, 118.0, 72.0, 57.0, 26.0, 33.0, 13.0, 7.0, 8.0, 8.0, 9.0, 6.0, 4.0, 1.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-67.5625, -65.56298828125, -63.5634765625, -61.56396484375, -59.564453125, -57.56494140625, -55.5654296875, -53.56591796875, -51.56640625, -49.56689453125, -47.5673828125, -45.56787109375, -43.568359375, -41.56884765625, -39.5693359375, -37.56982421875, -35.5703125, -33.57080078125, -31.5712890625, -29.57177734375, -27.572265625, -25.57275390625, -23.5732421875, -21.57373046875, -19.57421875, -17.57470703125, -15.5751953125, -13.57568359375, -11.576171875, -9.57666015625, -7.5771484375, -5.57763671875, -3.578125, -1.57861328125, 0.4208984375, 2.42041015625, 4.419921875, 6.41943359375, 8.4189453125, 10.41845703125, 12.41796875, 14.41748046875, 16.4169921875, 18.41650390625, 20.416015625, 22.41552734375, 24.4150390625, 26.41455078125, 28.4140625, 30.41357421875, 32.4130859375, 34.41259765625, 36.412109375, 38.41162109375, 40.4111328125, 42.41064453125, 44.41015625, 46.40966796875, 48.4091796875, 50.40869140625, 52.408203125, 54.40771484375, 56.4072265625, 58.40673828125, 60.40625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 9.0, 13.0, 19.0, 27.0, 41.0, 37.0, 41.0, 49.0, 60.0, 49.0, 76.0, 50.0, 65.0, 62.0, 63.0, 56.0, 49.0, 45.0, 36.0, 31.0, 20.0, 17.0, 19.0, 20.0, 14.0, 6.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-72.125, -70.28271484375, -68.4404296875, -66.59814453125, -64.755859375, -62.91357421875, -61.0712890625, -59.22900390625, -57.38671875, -55.54443359375, -53.7021484375, -51.85986328125, -50.017578125, -48.17529296875, -46.3330078125, -44.49072265625, -42.6484375, -40.80615234375, -38.9638671875, -37.12158203125, -35.279296875, -33.43701171875, -31.5947265625, -29.75244140625, -27.91015625, -26.06787109375, -24.2255859375, -22.38330078125, -20.541015625, -18.69873046875, -16.8564453125, -15.01416015625, -13.171875, -11.32958984375, -9.4873046875, -7.64501953125, -5.802734375, -3.96044921875, -2.1181640625, -0.27587890625, 1.56640625, 3.40869140625, 5.2509765625, 7.09326171875, 8.935546875, 10.77783203125, 12.6201171875, 14.46240234375, 16.3046875, 18.14697265625, 19.9892578125, 21.83154296875, 23.673828125, 25.51611328125, 27.3583984375, 29.20068359375, 31.04296875, 32.88525390625, 34.7275390625, 36.56982421875, 38.412109375, 40.25439453125, 42.0966796875, 43.93896484375, 45.78125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 17.0, 24.0, 35.0, 52.0, 132.0, 266.0, 643.0, 2669.0, 23152.0, 790295.0, 219842.0, 9127.0, 1433.0, 457.0, 182.0, 91.0, 43.0, 39.0, 19.0, 14.0, 8.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.8125, -37.111328125, -35.41015625, -33.708984375, -32.0078125, -30.306640625, -28.60546875, -26.904296875, -25.203125, -23.501953125, -21.80078125, -20.099609375, -18.3984375, -16.697265625, -14.99609375, -13.294921875, -11.59375, -9.892578125, -8.19140625, -6.490234375, -4.7890625, -3.087890625, -1.38671875, 0.314453125, 2.015625, 3.716796875, 5.41796875, 7.119140625, 8.8203125, 10.521484375, 12.22265625, 13.923828125, 15.625, 17.326171875, 19.02734375, 20.728515625, 22.4296875, 24.130859375, 25.83203125, 27.533203125, 29.234375, 30.935546875, 32.63671875, 34.337890625, 36.0390625, 37.740234375, 39.44140625, 41.142578125, 42.84375, 44.544921875, 46.24609375, 47.947265625, 49.6484375, 51.349609375, 53.05078125, 54.751953125, 56.453125, 58.154296875, 59.85546875, 61.556640625, 63.2578125, 64.958984375, 66.66015625, 68.361328125, 70.0625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 14.0, 11.0, 28.0, 45.0, 82.0, 108.0, 151.0, 174.0, 123.0, 103.0, 71.0, 35.0, 23.0, 13.0, 10.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002742767333984375, -0.002551734447479248, -0.002360701560974121, -0.002169668674468994, -0.001978635787963867, -0.0017876029014587402, -0.0015965700149536133, -0.0014055371284484863, -0.0012145042419433594, -0.0010234713554382324, -0.0008324384689331055, -0.0006414055824279785, -0.00045037269592285156, -0.0002593398094177246, -6.830692291259766e-05, 0.0001227259635925293, 0.00031375885009765625, 0.0005047917366027832, 0.0006958246231079102, 0.0008868575096130371, 0.001077890396118164, 0.001268923282623291, 0.001459956169128418, 0.001650989055633545, 0.0018420219421386719, 0.002033054828643799, 0.0022240877151489258, 0.0024151206016540527, 0.0026061534881591797, 0.0027971863746643066, 0.0029882192611694336, 0.0031792521476745605, 0.0033702850341796875, 0.0035613179206848145, 0.0037523508071899414, 0.003943383693695068, 0.004134416580200195, 0.004325449466705322, 0.004516482353210449, 0.004707515239715576, 0.004898548126220703, 0.00508958101272583, 0.005280613899230957, 0.005471646785736084, 0.005662679672241211, 0.005853712558746338, 0.006044745445251465, 0.006235778331756592, 0.006426811218261719, 0.006617844104766846, 0.006808876991271973, 0.0069999098777771, 0.0071909427642822266, 0.0073819756507873535, 0.0075730085372924805, 0.007764041423797607, 0.007955074310302734, 0.008146107196807861, 0.008337140083312988, 0.008528172969818115, 0.008719205856323242, 0.00891023874282837, 0.009101271629333496, 0.009292304515838623, 0.00948333740234375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 7.0, 16.0, 26.0, 34.0, 41.0, 70.0, 74.0, 133.0, 209.0, 382.0, 658.0, 1305.0, 3105.0, 9403.0, 41141.0, 357857.0, 553533.0, 60908.0, 12493.0, 3772.0, 1512.0, 727.0, 413.0, 244.0, 163.0, 93.0, 59.0, 46.0, 30.0, 23.0, 16.0, 11.0, 10.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.8125, -26.972412109375, -26.13232421875, -25.292236328125, -24.4521484375, -23.612060546875, -22.77197265625, -21.931884765625, -21.091796875, -20.251708984375, -19.41162109375, -18.571533203125, -17.7314453125, -16.891357421875, -16.05126953125, -15.211181640625, -14.37109375, -13.531005859375, -12.69091796875, -11.850830078125, -11.0107421875, -10.170654296875, -9.33056640625, -8.490478515625, -7.650390625, -6.810302734375, -5.97021484375, -5.130126953125, -4.2900390625, -3.449951171875, -2.60986328125, -1.769775390625, -0.9296875, -0.089599609375, 0.75048828125, 1.590576171875, 2.4306640625, 3.270751953125, 4.11083984375, 4.950927734375, 5.791015625, 6.631103515625, 7.47119140625, 8.311279296875, 9.1513671875, 9.991455078125, 10.83154296875, 11.671630859375, 12.51171875, 13.351806640625, 14.19189453125, 15.031982421875, 15.8720703125, 16.712158203125, 17.55224609375, 18.392333984375, 19.232421875, 20.072509765625, 20.91259765625, 21.752685546875, 22.5927734375, 23.432861328125, 24.27294921875, 25.113037109375, 25.953125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 16.0, 19.0, 25.0, 42.0, 40.0, 65.0, 68.0, 109.0, 125.0, 113.0, 90.0, 74.0, 59.0, 38.0, 31.0, 21.0, 11.0, 11.0, 4.0, 6.0, 7.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.484375, -27.535400390625, -26.58642578125, -25.637451171875, -24.6884765625, -23.739501953125, -22.79052734375, -21.841552734375, -20.892578125, -19.943603515625, -18.99462890625, -18.045654296875, -17.0966796875, -16.147705078125, -15.19873046875, -14.249755859375, -13.30078125, -12.351806640625, -11.40283203125, -10.453857421875, -9.5048828125, -8.555908203125, -7.60693359375, -6.657958984375, -5.708984375, -4.760009765625, -3.81103515625, -2.862060546875, -1.9130859375, -0.964111328125, -0.01513671875, 0.933837890625, 1.8828125, 2.831787109375, 3.78076171875, 4.729736328125, 5.6787109375, 6.627685546875, 7.57666015625, 8.525634765625, 9.474609375, 10.423583984375, 11.37255859375, 12.321533203125, 13.2705078125, 14.219482421875, 15.16845703125, 16.117431640625, 17.06640625, 18.015380859375, 18.96435546875, 19.913330078125, 20.8623046875, 21.811279296875, 22.76025390625, 23.709228515625, 24.658203125, 25.607177734375, 26.55615234375, 27.505126953125, 28.4541015625, 29.403076171875, 30.35205078125, 31.301025390625, 32.25]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 13.0, 23.0, 121.0, 343.0, 363.0, 122.0, 24.0, 6.0, 1.0, 1.0, 1.0], "bins": [-2298.83251953125, -2258.530517578125, -2218.228271484375, -2177.92626953125, -2137.6240234375, -2097.322021484375, -2057.019775390625, -2016.7177734375, -1976.4156494140625, -1936.113525390625, -1895.8114013671875, -1855.50927734375, -1815.2071533203125, -1774.905029296875, -1734.60302734375, -1694.3009033203125, -1653.998779296875, -1613.6966552734375, -1573.39453125, -1533.0924072265625, -1492.790283203125, -1452.48828125, -1412.18603515625, -1371.884033203125, -1331.581787109375, -1291.2796630859375, -1250.9775390625, -1210.6754150390625, -1170.373291015625, -1130.0712890625, -1089.76904296875, -1049.467041015625, -1009.1649169921875, -968.86279296875, -928.5606689453125, -888.258544921875, -847.9564819335938, -807.6543579101562, -767.3522338867188, -727.0501708984375, -686.748046875, -646.4459228515625, -606.143798828125, -565.8416748046875, -525.5396118164062, -485.23748779296875, -444.93536376953125, -404.6332702636719, -364.33111572265625, -324.02899169921875, -283.7268981933594, -243.42477416992188, -203.12266540527344, -162.820556640625, -122.5184326171875, -82.21633911132812, -41.914215087890625, -1.6121025085449219, 38.69001007080078, 78.99212646484375, 119.29423522949219, 159.59634399414062, 199.89846801757812, 240.2005615234375, 280.502685546875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 8.0, 4.0, 8.0, 13.0, 13.0, 17.0, 23.0, 22.0, 20.0, 24.0, 24.0, 40.0, 48.0, 29.0, 43.0, 41.0, 52.0, 43.0, 47.0, 42.0, 45.0, 49.0, 40.0, 37.0, 26.0, 36.0, 26.0, 29.0, 28.0, 19.0, 21.0, 16.0, 11.0, 10.0, 13.0, 7.0, 9.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-199.07492065429688, -192.99472045898438, -186.91453552246094, -180.83433532714844, -174.754150390625, -168.6739501953125, -162.59375, -156.5135498046875, -150.43336486816406, -144.35316467285156, -138.27297973632812, -132.19277954101562, -126.11258697509766, -120.03239440917969, -113.95219421386719, -107.87200164794922, -101.79180908203125, -95.71161651611328, -89.63142395019531, -83.55122375488281, -77.47103118896484, -71.39083862304688, -65.31063842773438, -59.230445861816406, -53.15025329589844, -47.07006072998047, -40.989864349365234, -34.90966796875, -28.82947540283203, -22.74928092956543, -16.669086456298828, -10.588890075683594, -4.508697509765625, 1.5714969635009766, 7.651691436767578, 13.73188591003418, 19.81208038330078, 25.892274856567383, 31.972469329833984, 38.05266571044922, 44.13285827636719, 50.213050842285156, 56.29324722290039, 62.373443603515625, 68.4536361694336, 74.53382873535156, 80.61402893066406, 86.69422149658203, 92.7744140625, 98.85460662841797, 104.93479919433594, 111.01499938964844, 117.0951919555664, 123.17538452148438, 129.25558471679688, 135.33578491210938, 141.4159698486328, 147.4961700439453, 153.57635498046875, 159.65655517578125, 165.73675537109375, 171.8169403076172, 177.8971405029297, 183.97732543945312, 190.05752563476562]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 13.0, 15.0, 13.0, 21.0, 25.0, 41.0, 63.0, 72.0, 83.0, 165.0, 224.0, 330.0, 579.0, 902.0, 1651.0, 3321.0, 7504.0, 25089.0, 4113475.0, 25804.0, 7407.0, 3216.0, 1727.0, 914.0, 555.0, 304.0, 246.0, 161.0, 102.0, 72.0, 51.0, 30.0, 37.0, 11.0, 9.0, 12.0, 2.0, 8.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.28125, -46.6982421875, -45.115234375, -43.5322265625, -41.94921875, -40.3662109375, -38.783203125, -37.2001953125, -35.6171875, -34.0341796875, -32.451171875, -30.8681640625, -29.28515625, -27.7021484375, -26.119140625, -24.5361328125, -22.953125, -21.3701171875, -19.787109375, -18.2041015625, -16.62109375, -15.0380859375, -13.455078125, -11.8720703125, -10.2890625, -8.7060546875, -7.123046875, -5.5400390625, -3.95703125, -2.3740234375, -0.791015625, 0.7919921875, 2.375, 3.9580078125, 5.541015625, 7.1240234375, 8.70703125, 10.2900390625, 11.873046875, 13.4560546875, 15.0390625, 16.6220703125, 18.205078125, 19.7880859375, 21.37109375, 22.9541015625, 24.537109375, 26.1201171875, 27.703125, 29.2861328125, 30.869140625, 32.4521484375, 34.03515625, 35.6181640625, 37.201171875, 38.7841796875, 40.3671875, 41.9501953125, 43.533203125, 45.1162109375, 46.69921875, 48.2822265625, 49.865234375, 51.4482421875, 53.03125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 14.0, 14.0, 19.0, 14.0, 33.0, 26.0, 35.0, 62.0, 51.0, 57.0, 80.0, 72.0, 66.0, 65.0, 69.0, 65.0, 46.0, 42.0, 38.0, 25.0, 27.0, 15.0, 11.0, 14.0, 10.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.8671875, -12.5009765625, -12.134765625, -11.7685546875, -11.40234375, -11.0361328125, -10.669921875, -10.3037109375, -9.9375, -9.5712890625, -9.205078125, -8.8388671875, -8.47265625, -8.1064453125, -7.740234375, -7.3740234375, -7.0078125, -6.6416015625, -6.275390625, -5.9091796875, -5.54296875, -5.1767578125, -4.810546875, -4.4443359375, -4.078125, -3.7119140625, -3.345703125, -2.9794921875, -2.61328125, -2.2470703125, -1.880859375, -1.5146484375, -1.1484375, -0.7822265625, -0.416015625, -0.0498046875, 0.31640625, 0.6826171875, 1.048828125, 1.4150390625, 1.78125, 2.1474609375, 2.513671875, 2.8798828125, 3.24609375, 3.6123046875, 3.978515625, 4.3447265625, 4.7109375, 5.0771484375, 5.443359375, 5.8095703125, 6.17578125, 6.5419921875, 6.908203125, 7.2744140625, 7.640625, 8.0068359375, 8.373046875, 8.7392578125, 9.10546875, 9.4716796875, 9.837890625, 10.2041015625, 10.5703125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 6.0, 7.0, 13.0, 29.0, 24.0, 34.0, 49.0, 69.0, 75.0, 137.0, 201.0, 266.0, 438.0, 625.0, 1009.0, 1688.0, 3218.0, 7568.0, 29763.0, 4087975.0, 42788.0, 9327.0, 3737.0, 1979.0, 1115.0, 677.0, 443.0, 319.0, 214.0, 152.0, 91.0, 74.0, 45.0, 33.0, 19.0, 13.0, 11.0, 11.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.34375, -45.68798828125, -44.0322265625, -42.37646484375, -40.720703125, -39.06494140625, -37.4091796875, -35.75341796875, -34.09765625, -32.44189453125, -30.7861328125, -29.13037109375, -27.474609375, -25.81884765625, -24.1630859375, -22.50732421875, -20.8515625, -19.19580078125, -17.5400390625, -15.88427734375, -14.228515625, -12.57275390625, -10.9169921875, -9.26123046875, -7.60546875, -5.94970703125, -4.2939453125, -2.63818359375, -0.982421875, 0.67333984375, 2.3291015625, 3.98486328125, 5.640625, 7.29638671875, 8.9521484375, 10.60791015625, 12.263671875, 13.91943359375, 15.5751953125, 17.23095703125, 18.88671875, 20.54248046875, 22.1982421875, 23.85400390625, 25.509765625, 27.16552734375, 28.8212890625, 30.47705078125, 32.1328125, 33.78857421875, 35.4443359375, 37.10009765625, 38.755859375, 40.41162109375, 42.0673828125, 43.72314453125, 45.37890625, 47.03466796875, 48.6904296875, 50.34619140625, 52.001953125, 53.65771484375, 55.3134765625, 56.96923828125, 58.625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 5.0, 5.0, 9.0, 22.0, 21.0, 59.0, 3811.0, 74.0, 25.0, 12.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.977783203125, -15.50244140625, -15.027099609375, -14.5517578125, -14.076416015625, -13.60107421875, -13.125732421875, -12.650390625, -12.175048828125, -11.69970703125, -11.224365234375, -10.7490234375, -10.273681640625, -9.79833984375, -9.322998046875, -8.84765625, -8.372314453125, -7.89697265625, -7.421630859375, -6.9462890625, -6.470947265625, -5.99560546875, -5.520263671875, -5.044921875, -4.569580078125, -4.09423828125, -3.618896484375, -3.1435546875, -2.668212890625, -2.19287109375, -1.717529296875, -1.2421875, -0.766845703125, -0.29150390625, 0.183837890625, 0.6591796875, 1.134521484375, 1.60986328125, 2.085205078125, 2.560546875, 3.035888671875, 3.51123046875, 3.986572265625, 4.4619140625, 4.937255859375, 5.41259765625, 5.887939453125, 6.36328125, 6.838623046875, 7.31396484375, 7.789306640625, 8.2646484375, 8.739990234375, 9.21533203125, 9.690673828125, 10.166015625, 10.641357421875, 11.11669921875, 11.592041015625, 12.0673828125, 12.542724609375, 13.01806640625, 13.493408203125, 13.96875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 9.0, 4.0, 13.0, 41.0, 126.0, 279.0, 276.0, 166.0, 57.0, 22.0, 8.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.8508071899414, -83.77415466308594, -80.69749450683594, -77.62084197998047, -74.544189453125, -71.46753692626953, -68.39088439941406, -65.31422424316406, -62.237571716308594, -59.160919189453125, -56.08426284790039, -53.007606506347656, -49.93095397949219, -46.85430145263672, -43.777645111083984, -40.70098876953125, -37.62433624267578, -34.54768371582031, -31.471027374267578, -28.394372940063477, -25.317718505859375, -22.241064071655273, -19.164409637451172, -16.08775520324707, -13.011100769042969, -9.934446334838867, -6.857791900634766, -3.781137466430664, -0.7044830322265625, 2.372171401977539, 5.448825836181641, 8.525480270385742, 11.602134704589844, 14.678789138793945, 17.755443572998047, 20.83209800720215, 23.90875244140625, 26.98540687561035, 30.062061309814453, 33.13871765136719, 36.215370178222656, 39.292022705078125, 42.36867904663086, 45.445335388183594, 48.52198791503906, 51.59864044189453, 54.675296783447266, 57.751953125, 60.82860565185547, 63.90525817871094, 66.98191833496094, 70.0585708618164, 73.13522338867188, 76.21187591552734, 79.28852844238281, 82.36518859863281, 85.44184112548828, 88.51849365234375, 91.59515380859375, 94.67180633544922, 97.74845886230469, 100.82511138916016, 103.90176391601562, 106.97842407226562, 110.0550765991211]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 7.0, 9.0, 14.0, 12.0, 18.0, 26.0, 31.0, 31.0, 34.0, 60.0, 36.0, 62.0, 57.0, 56.0, 61.0, 48.0, 56.0, 61.0, 49.0, 58.0, 33.0, 32.0, 32.0, 32.0, 17.0, 13.0, 9.0, 9.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.085403442382812, -26.19303321838379, -25.300662994384766, -24.408292770385742, -23.51592254638672, -22.623552322387695, -21.731182098388672, -20.838809967041016, -19.946441650390625, -19.0540714263916, -18.161701202392578, -17.269330978393555, -16.37696075439453, -15.484590530395508, -14.592219352722168, -13.699849128723145, -12.807477951049805, -11.915107727050781, -11.022737503051758, -10.130367279052734, -9.237997055053711, -8.345626831054688, -7.453255653381348, -6.560885429382324, -5.668515205383301, -4.776144981384277, -3.883774518966675, -2.9914040565490723, -2.099033832550049, -1.2066636085510254, -0.31429290771484375, 0.5780773162841797, 1.4704456329345703, 2.3628158569335938, 3.2551863193511963, 4.147556781768799, 5.039927005767822, 5.932297229766846, 6.824667930603027, 7.717038154602051, 8.609408378601074, 9.501778602600098, 10.394148826599121, 11.286520004272461, 12.178890228271484, 13.071260452270508, 13.963630676269531, 14.856000900268555, 15.748371124267578, 16.6407413482666, 17.533111572265625, 18.42548179626465, 19.317852020263672, 20.210222244262695, 21.10259246826172, 21.994964599609375, 22.887332916259766, 23.77970314025879, 24.672073364257812, 25.564443588256836, 26.45681381225586, 27.349184036254883, 28.241554260253906, 29.133926391601562, 30.026296615600586]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 11.0, 9.0, 13.0, 35.0, 30.0, 50.0, 84.0, 122.0, 207.0, 377.0, 608.0, 1075.0, 1913.0, 3732.0, 7892.0, 17707.0, 41389.0, 106023.0, 256060.0, 330949.0, 165575.0, 65503.0, 26293.0, 11509.0, 5329.0, 2572.0, 1396.0, 798.0, 467.0, 290.0, 184.0, 116.0, 88.0, 49.0, 34.0, 21.0, 10.0, 6.0, 8.0, 9.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-29.359375, -28.501953125, -27.64453125, -26.787109375, -25.9296875, -25.072265625, -24.21484375, -23.357421875, -22.5, -21.642578125, -20.78515625, -19.927734375, -19.0703125, -18.212890625, -17.35546875, -16.498046875, -15.640625, -14.783203125, -13.92578125, -13.068359375, -12.2109375, -11.353515625, -10.49609375, -9.638671875, -8.78125, -7.923828125, -7.06640625, -6.208984375, -5.3515625, -4.494140625, -3.63671875, -2.779296875, -1.921875, -1.064453125, -0.20703125, 0.650390625, 1.5078125, 2.365234375, 3.22265625, 4.080078125, 4.9375, 5.794921875, 6.65234375, 7.509765625, 8.3671875, 9.224609375, 10.08203125, 10.939453125, 11.796875, 12.654296875, 13.51171875, 14.369140625, 15.2265625, 16.083984375, 16.94140625, 17.798828125, 18.65625, 19.513671875, 20.37109375, 21.228515625, 22.0859375, 22.943359375, 23.80078125, 24.658203125, 25.515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 0.0, 5.0, 4.0, 3.0, 7.0, 9.0, 9.0, 5.0, 17.0, 15.0, 25.0, 28.0, 38.0, 44.0, 50.0, 56.0, 54.0, 70.0, 68.0, 56.0, 69.0, 67.0, 59.0, 53.0, 40.0, 31.0, 29.0, 27.0, 15.0, 16.0, 11.0, 6.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.0, -12.6279296875, -12.255859375, -11.8837890625, -11.51171875, -11.1396484375, -10.767578125, -10.3955078125, -10.0234375, -9.6513671875, -9.279296875, -8.9072265625, -8.53515625, -8.1630859375, -7.791015625, -7.4189453125, -7.046875, -6.6748046875, -6.302734375, -5.9306640625, -5.55859375, -5.1865234375, -4.814453125, -4.4423828125, -4.0703125, -3.6982421875, -3.326171875, -2.9541015625, -2.58203125, -2.2099609375, -1.837890625, -1.4658203125, -1.09375, -0.7216796875, -0.349609375, 0.0224609375, 0.39453125, 0.7666015625, 1.138671875, 1.5107421875, 1.8828125, 2.2548828125, 2.626953125, 2.9990234375, 3.37109375, 3.7431640625, 4.115234375, 4.4873046875, 4.859375, 5.2314453125, 5.603515625, 5.9755859375, 6.34765625, 6.7197265625, 7.091796875, 7.4638671875, 7.8359375, 8.2080078125, 8.580078125, 8.9521484375, 9.32421875, 9.6962890625, 10.068359375, 10.4404296875, 10.8125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 11.0, 12.0, 25.0, 38.0, 38.0, 71.0, 108.0, 184.0, 382.0, 686.0, 1587.0, 5890.0, 49166.0, 710908.0, 256808.0, 17299.0, 3099.0, 1047.0, 543.0, 278.0, 140.0, 70.0, 57.0, 36.0, 18.0, 5.0, 11.0, 16.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-94.125, -91.6337890625, -89.142578125, -86.6513671875, -84.16015625, -81.6689453125, -79.177734375, -76.6865234375, -74.1953125, -71.7041015625, -69.212890625, -66.7216796875, -64.23046875, -61.7392578125, -59.248046875, -56.7568359375, -54.265625, -51.7744140625, -49.283203125, -46.7919921875, -44.30078125, -41.8095703125, -39.318359375, -36.8271484375, -34.3359375, -31.8447265625, -29.353515625, -26.8623046875, -24.37109375, -21.8798828125, -19.388671875, -16.8974609375, -14.40625, -11.9150390625, -9.423828125, -6.9326171875, -4.44140625, -1.9501953125, 0.541015625, 3.0322265625, 5.5234375, 8.0146484375, 10.505859375, 12.9970703125, 15.48828125, 17.9794921875, 20.470703125, 22.9619140625, 25.453125, 27.9443359375, 30.435546875, 32.9267578125, 35.41796875, 37.9091796875, 40.400390625, 42.8916015625, 45.3828125, 47.8740234375, 50.365234375, 52.8564453125, 55.34765625, 57.8388671875, 60.330078125, 62.8212890625, 65.3125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 16.0, 13.0, 9.0, 19.0, 23.0, 33.0, 32.0, 47.0, 57.0, 69.0, 52.0, 50.0, 68.0, 67.0, 54.0, 53.0, 59.0, 47.0, 44.0, 34.0, 29.0, 20.0, 21.0, 14.0, 9.0, 12.0, 9.0, 2.0, 3.0, 7.0, 4.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.25, -51.181640625, -49.11328125, -47.044921875, -44.9765625, -42.908203125, -40.83984375, -38.771484375, -36.703125, -34.634765625, -32.56640625, -30.498046875, -28.4296875, -26.361328125, -24.29296875, -22.224609375, -20.15625, -18.087890625, -16.01953125, -13.951171875, -11.8828125, -9.814453125, -7.74609375, -5.677734375, -3.609375, -1.541015625, 0.52734375, 2.595703125, 4.6640625, 6.732421875, 8.80078125, 10.869140625, 12.9375, 15.005859375, 17.07421875, 19.142578125, 21.2109375, 23.279296875, 25.34765625, 27.416015625, 29.484375, 31.552734375, 33.62109375, 35.689453125, 37.7578125, 39.826171875, 41.89453125, 43.962890625, 46.03125, 48.099609375, 50.16796875, 52.236328125, 54.3046875, 56.373046875, 58.44140625, 60.509765625, 62.578125, 64.646484375, 66.71484375, 68.783203125, 70.8515625, 72.919921875, 74.98828125, 77.056640625, 79.125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 6.0, 12.0, 16.0, 18.0, 27.0, 25.0, 52.0, 78.0, 100.0, 173.0, 324.0, 708.0, 2201.0, 10364.0, 162290.0, 838363.0, 27309.0, 4154.0, 1095.0, 523.0, 248.0, 152.0, 71.0, 57.0, 37.0, 29.0, 15.0, 21.0, 21.0, 13.0, 9.0, 5.0, 4.0, 9.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.5, -63.40234375, -61.3046875, -59.20703125, -57.109375, -55.01171875, -52.9140625, -50.81640625, -48.71875, -46.62109375, -44.5234375, -42.42578125, -40.328125, -38.23046875, -36.1328125, -34.03515625, -31.9375, -29.83984375, -27.7421875, -25.64453125, -23.546875, -21.44921875, -19.3515625, -17.25390625, -15.15625, -13.05859375, -10.9609375, -8.86328125, -6.765625, -4.66796875, -2.5703125, -0.47265625, 1.625, 3.72265625, 5.8203125, 7.91796875, 10.015625, 12.11328125, 14.2109375, 16.30859375, 18.40625, 20.50390625, 22.6015625, 24.69921875, 26.796875, 28.89453125, 30.9921875, 33.08984375, 35.1875, 37.28515625, 39.3828125, 41.48046875, 43.578125, 45.67578125, 47.7734375, 49.87109375, 51.96875, 54.06640625, 56.1640625, 58.26171875, 60.359375, 62.45703125, 64.5546875, 66.65234375, 68.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 8.0, 8.0, 6.0, 20.0, 34.0, 30.0, 59.0, 82.0, 81.0, 120.0, 112.0, 119.0, 71.0, 63.0, 56.0, 28.0, 24.0, 13.0, 9.0, 12.0, 10.0, 2.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00437164306640625, -0.004221498966217041, -0.004071354866027832, -0.003921210765838623, -0.003771066665649414, -0.003620922565460205, -0.003470778465270996, -0.003320634365081787, -0.003170490264892578, -0.003020346164703369, -0.00287020206451416, -0.002720057964324951, -0.002569913864135742, -0.002419769763946533, -0.0022696256637573242, -0.0021194815635681152, -0.0019693374633789062, -0.0018191933631896973, -0.0016690492630004883, -0.0015189051628112793, -0.0013687610626220703, -0.0012186169624328613, -0.0010684728622436523, -0.0009183287620544434, -0.0007681846618652344, -0.0006180405616760254, -0.0004678964614868164, -0.0003177523612976074, -0.00016760826110839844, -1.7464160919189453e-05, 0.00013267993927001953, 0.0002828240394592285, 0.0004329681396484375, 0.0005831122398376465, 0.0007332563400268555, 0.0008834004402160645, 0.0010335445404052734, 0.0011836886405944824, 0.0013338327407836914, 0.0014839768409729004, 0.0016341209411621094, 0.0017842650413513184, 0.0019344091415405273, 0.0020845532417297363, 0.0022346973419189453, 0.0023848414421081543, 0.0025349855422973633, 0.0026851296424865723, 0.0028352737426757812, 0.0029854178428649902, 0.0031355619430541992, 0.003285706043243408, 0.003435850143432617, 0.003585994243621826, 0.003736138343811035, 0.003886282444000244, 0.004036426544189453, 0.004186570644378662, 0.004336714744567871, 0.00448685884475708, 0.004637002944946289, 0.004787147045135498, 0.004937291145324707, 0.005087435245513916, 0.005237579345703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 5.0, 9.0, 7.0, 10.0, 25.0, 31.0, 40.0, 59.0, 84.0, 115.0, 174.0, 307.0, 540.0, 1171.0, 3123.0, 11425.0, 82437.0, 842212.0, 88967.0, 11889.0, 3225.0, 1239.0, 582.0, 306.0, 176.0, 112.0, 74.0, 58.0, 47.0, 33.0, 13.0, 12.0, 9.0, 6.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.65625, -45.17578125, -43.6953125, -42.21484375, -40.734375, -39.25390625, -37.7734375, -36.29296875, -34.8125, -33.33203125, -31.8515625, -30.37109375, -28.890625, -27.41015625, -25.9296875, -24.44921875, -22.96875, -21.48828125, -20.0078125, -18.52734375, -17.046875, -15.56640625, -14.0859375, -12.60546875, -11.125, -9.64453125, -8.1640625, -6.68359375, -5.203125, -3.72265625, -2.2421875, -0.76171875, 0.71875, 2.19921875, 3.6796875, 5.16015625, 6.640625, 8.12109375, 9.6015625, 11.08203125, 12.5625, 14.04296875, 15.5234375, 17.00390625, 18.484375, 19.96484375, 21.4453125, 22.92578125, 24.40625, 25.88671875, 27.3671875, 28.84765625, 30.328125, 31.80859375, 33.2890625, 34.76953125, 36.25, 37.73046875, 39.2109375, 40.69140625, 42.171875, 43.65234375, 45.1328125, 46.61328125, 48.09375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 5.0, 8.0, 7.0, 14.0, 13.0, 25.0, 42.0, 64.0, 106.0, 152.0, 150.0, 129.0, 105.0, 47.0, 28.0, 22.0, 14.0, 13.0, 8.0, 6.0, 2.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.9375, -41.2314453125, -39.525390625, -37.8193359375, -36.11328125, -34.4072265625, -32.701171875, -30.9951171875, -29.2890625, -27.5830078125, -25.876953125, -24.1708984375, -22.46484375, -20.7587890625, -19.052734375, -17.3466796875, -15.640625, -13.9345703125, -12.228515625, -10.5224609375, -8.81640625, -7.1103515625, -5.404296875, -3.6982421875, -1.9921875, -0.2861328125, 1.419921875, 3.1259765625, 4.83203125, 6.5380859375, 8.244140625, 9.9501953125, 11.65625, 13.3623046875, 15.068359375, 16.7744140625, 18.48046875, 20.1865234375, 21.892578125, 23.5986328125, 25.3046875, 27.0107421875, 28.716796875, 30.4228515625, 32.12890625, 33.8349609375, 35.541015625, 37.2470703125, 38.953125, 40.6591796875, 42.365234375, 44.0712890625, 45.77734375, 47.4833984375, 49.189453125, 50.8955078125, 52.6015625, 54.3076171875, 56.013671875, 57.7197265625, 59.42578125, 61.1318359375, 62.837890625, 64.5439453125, 66.25]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 12.0, 90.0, 558.0, 306.0, 36.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3095.76416015625, -3032.334228515625, -2968.904052734375, -2905.47412109375, -2842.044189453125, -2778.614013671875, -2715.18408203125, -2651.754150390625, -2588.323974609375, -2524.89404296875, -2461.4638671875, -2398.033935546875, -2334.60400390625, -2271.173828125, -2207.743896484375, -2144.31396484375, -2080.884033203125, -2017.4539794921875, -1954.0240478515625, -1890.593994140625, -1827.1639404296875, -1763.7340087890625, -1700.303955078125, -1636.8740234375, -1573.44384765625, -1510.0137939453125, -1446.5838623046875, -1383.15380859375, -1319.7237548828125, -1256.2938232421875, -1192.86376953125, -1129.433837890625, -1066.0037841796875, -1002.5737915039062, -939.1437377929688, -875.7137451171875, -812.2837524414062, -748.853759765625, -685.4237060546875, -621.9937133789062, -558.563720703125, -495.1336975097656, -431.7037048339844, -368.273681640625, -304.84368896484375, -241.41366577148438, -177.983642578125, -114.55364990234375, -51.12359619140625, 12.306415557861328, 75.7364273071289, 139.16644287109375, 202.59645080566406, 266.0264587402344, 329.45648193359375, 392.886474609375, 456.3164978027344, 519.7465209960938, 583.176513671875, 646.6065673828125, 710.0365600585938, 773.466552734375, 836.8966064453125, 900.3265380859375, 963.756591796875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 5.0, 4.0, 5.0, 7.0, 8.0, 13.0, 14.0, 16.0, 16.0, 23.0, 26.0, 43.0, 30.0, 45.0, 43.0, 51.0, 47.0, 55.0, 53.0, 55.0, 55.0, 42.0, 41.0, 27.0, 46.0, 30.0, 37.0, 33.0, 28.0, 22.0, 14.0, 12.0, 13.0, 9.0, 5.0, 6.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-270.54229736328125, -262.680419921875, -254.81851196289062, -246.9566192626953, -239.0947265625, -231.23284912109375, -223.37094116210938, -215.50906372070312, -207.6471710205078, -199.7852783203125, -191.9233856201172, -184.06149291992188, -176.19960021972656, -168.33770751953125, -160.475830078125, -152.6139373779297, -144.75204467773438, -136.89015197753906, -129.02825927734375, -121.16636657714844, -113.30448150634766, -105.44258880615234, -97.58069610595703, -89.71881103515625, -81.85690307617188, -73.99501037597656, -66.13311767578125, -58.2712287902832, -50.409339904785156, -42.547447204589844, -34.68555450439453, -26.823665618896484, -18.961776733398438, -11.099885940551758, -3.2379941940307617, 4.623897552490234, 12.485788345336914, 20.347679138183594, 28.209571838378906, 36.07146072387695, 43.933353424072266, 51.79524612426758, 59.657135009765625, 67.51902770996094, 75.38092041015625, 83.24281311035156, 91.10470581054688, 98.96659088134766, 106.82848358154297, 114.69037628173828, 122.5522689819336, 130.41415405273438, 138.2760467529297, 146.137939453125, 153.9998321533203, 161.86172485351562, 169.72361755371094, 177.58551025390625, 185.44740295410156, 193.30929565429688, 201.1711883544922, 209.0330810546875, 216.89495849609375, 224.75685119628906, 232.61874389648438]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 12.0, 7.0, 12.0, 20.0, 40.0, 50.0, 83.0, 155.0, 267.0, 543.0, 1181.0, 3285.0, 13670.0, 3956652.0, 202708.0, 10811.0, 2678.0, 984.0, 468.0, 232.0, 143.0, 86.0, 63.0, 37.0, 25.0, 14.0, 12.0, 10.0, 12.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.65625, -50.25537109375, -47.8544921875, -45.45361328125, -43.052734375, -40.65185546875, -38.2509765625, -35.85009765625, -33.44921875, -31.04833984375, -28.6474609375, -26.24658203125, -23.845703125, -21.44482421875, -19.0439453125, -16.64306640625, -14.2421875, -11.84130859375, -9.4404296875, -7.03955078125, -4.638671875, -2.23779296875, 0.1630859375, 2.56396484375, 4.96484375, 7.36572265625, 9.7666015625, 12.16748046875, 14.568359375, 16.96923828125, 19.3701171875, 21.77099609375, 24.171875, 26.57275390625, 28.9736328125, 31.37451171875, 33.775390625, 36.17626953125, 38.5771484375, 40.97802734375, 43.37890625, 45.77978515625, 48.1806640625, 50.58154296875, 52.982421875, 55.38330078125, 57.7841796875, 60.18505859375, 62.5859375, 64.98681640625, 67.3876953125, 69.78857421875, 72.189453125, 74.59033203125, 76.9912109375, 79.39208984375, 81.79296875, 84.19384765625, 86.5947265625, 88.99560546875, 91.396484375, 93.79736328125, 96.1982421875, 98.59912109375, 101.0]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 7.0, 6.0, 9.0, 12.0, 17.0, 31.0, 54.0, 44.0, 63.0, 87.0, 91.0, 88.0, 106.0, 95.0, 76.0, 42.0, 41.0, 34.0, 19.0, 22.0, 15.0, 7.0, 6.0, 1.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.09375, -15.5546875, -15.015625, -14.4765625, -13.9375, -13.3984375, -12.859375, -12.3203125, -11.78125, -11.2421875, -10.703125, -10.1640625, -9.625, -9.0859375, -8.546875, -8.0078125, -7.46875, -6.9296875, -6.390625, -5.8515625, -5.3125, -4.7734375, -4.234375, -3.6953125, -3.15625, -2.6171875, -2.078125, -1.5390625, -1.0, -0.4609375, 0.078125, 0.6171875, 1.15625, 1.6953125, 2.234375, 2.7734375, 3.3125, 3.8515625, 4.390625, 4.9296875, 5.46875, 6.0078125, 6.546875, 7.0859375, 7.625, 8.1640625, 8.703125, 9.2421875, 9.78125, 10.3203125, 10.859375, 11.3984375, 11.9375, 12.4765625, 13.015625, 13.5546875, 14.09375, 14.6328125, 15.171875, 15.7109375, 16.25, 16.7890625, 17.328125, 17.8671875, 18.40625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 8.0, 17.0, 14.0, 9.0, 20.0, 22.0, 27.0, 29.0, 56.0, 79.0, 151.0, 344.0, 999.0, 4046.0, 34707.0, 4102279.0, 44798.0, 4788.0, 1050.0, 349.0, 137.0, 81.0, 52.0, 35.0, 26.0, 36.0, 20.0, 18.0, 18.0, 8.0, 10.0, 7.0, 7.0, 4.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-122.9375, -119.748046875, -116.55859375, -113.369140625, -110.1796875, -106.990234375, -103.80078125, -100.611328125, -97.421875, -94.232421875, -91.04296875, -87.853515625, -84.6640625, -81.474609375, -78.28515625, -75.095703125, -71.90625, -68.716796875, -65.52734375, -62.337890625, -59.1484375, -55.958984375, -52.76953125, -49.580078125, -46.390625, -43.201171875, -40.01171875, -36.822265625, -33.6328125, -30.443359375, -27.25390625, -24.064453125, -20.875, -17.685546875, -14.49609375, -11.306640625, -8.1171875, -4.927734375, -1.73828125, 1.451171875, 4.640625, 7.830078125, 11.01953125, 14.208984375, 17.3984375, 20.587890625, 23.77734375, 26.966796875, 30.15625, 33.345703125, 36.53515625, 39.724609375, 42.9140625, 46.103515625, 49.29296875, 52.482421875, 55.671875, 58.861328125, 62.05078125, 65.240234375, 68.4296875, 71.619140625, 74.80859375, 77.998046875, 81.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 10.0, 10.0, 28.0, 56.0, 233.0, 3550.0, 110.0, 45.0, 25.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-85.6875, -84.080078125, -82.47265625, -80.865234375, -79.2578125, -77.650390625, -76.04296875, -74.435546875, -72.828125, -71.220703125, -69.61328125, -68.005859375, -66.3984375, -64.791015625, -63.18359375, -61.576171875, -59.96875, -58.361328125, -56.75390625, -55.146484375, -53.5390625, -51.931640625, -50.32421875, -48.716796875, -47.109375, -45.501953125, -43.89453125, -42.287109375, -40.6796875, -39.072265625, -37.46484375, -35.857421875, -34.25, -32.642578125, -31.03515625, -29.427734375, -27.8203125, -26.212890625, -24.60546875, -22.998046875, -21.390625, -19.783203125, -18.17578125, -16.568359375, -14.9609375, -13.353515625, -11.74609375, -10.138671875, -8.53125, -6.923828125, -5.31640625, -3.708984375, -2.1015625, -0.494140625, 1.11328125, 2.720703125, 4.328125, 5.935546875, 7.54296875, 9.150390625, 10.7578125, 12.365234375, 13.97265625, 15.580078125, 17.1875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 16.0, 43.0, 119.0, 248.0, 275.0, 190.0, 61.0, 36.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-300.34161376953125, -293.5458984375, -286.75018310546875, -279.9544677734375, -273.15875244140625, -266.363037109375, -259.56732177734375, -252.77159118652344, -245.97586059570312, -239.18014526367188, -232.38442993164062, -225.58871459960938, -218.79298400878906, -211.9972686767578, -205.20155334472656, -198.4058380126953, -191.61012268066406, -184.8144073486328, -178.01869201660156, -171.22296142578125, -164.42724609375, -157.63153076171875, -150.8358154296875, -144.04010009765625, -137.244384765625, -130.44866943359375, -123.65294647216797, -116.85723114013672, -110.06150817871094, -103.26579284667969, -96.47007751464844, -89.67436218261719, -82.87861633300781, -76.08290100097656, -69.28717803955078, -62.49146270751953, -55.695743560791016, -48.9000244140625, -42.10430908203125, -35.308589935302734, -28.51287078857422, -21.717151641845703, -14.92143440246582, -8.125717163085938, -1.3299980163574219, 5.465721130371094, 12.261436462402344, 19.05715560913086, 25.852874755859375, 32.64859390258789, 39.444313049316406, 46.240028381347656, 53.03574752807617, 59.83146667480469, 66.62718200683594, 73.42289733886719, 80.21862030029297, 87.01433563232422, 93.81005859375, 100.60577392578125, 107.4014892578125, 114.19721221923828, 120.99292755126953, 127.78865051269531, 134.58436584472656]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 18.0, 36.0, 46.0, 69.0, 78.0, 77.0, 121.0, 107.0, 102.0, 98.0, 72.0, 48.0, 39.0, 27.0, 15.0, 14.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.0882568359375, -126.77546691894531, -122.46267700195312, -118.14988708496094, -113.83709716796875, -109.52430725097656, -105.21151733398438, -100.89872741699219, -96.5859375, -92.27314758300781, -87.96035766601562, -83.64756774902344, -79.33477783203125, -75.02198791503906, -70.70919799804688, -66.39640808105469, -62.0836181640625, -57.77082824707031, -53.458038330078125, -49.14524841308594, -44.83245849609375, -40.51966857910156, -36.206878662109375, -31.894088745117188, -27.581298828125, -23.268508911132812, -18.955718994140625, -14.642929077148438, -10.33013916015625, -6.0173492431640625, -1.704559326171875, 2.6082305908203125, 6.9210052490234375, 11.233795166015625, 15.546585083007812, 19.859375, 24.172164916992188, 28.484954833984375, 32.79774475097656, 37.11053466796875, 41.42332458496094, 45.736114501953125, 50.04890441894531, 54.3616943359375, 58.67448425292969, 62.987274169921875, 67.30006408691406, 71.61285400390625, 75.92564392089844, 80.23843383789062, 84.55122375488281, 88.864013671875, 93.17680358886719, 97.48959350585938, 101.80238342285156, 106.11517333984375, 110.42796325683594, 114.74075317382812, 119.05354309082031, 123.3663330078125, 127.67912292480469, 131.99191284179688, 136.30470275878906, 140.61749267578125, 144.93028259277344]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 5.0, 14.0, 11.0, 12.0, 10.0, 26.0, 34.0, 43.0, 69.0, 79.0, 150.0, 206.0, 316.0, 530.0, 836.0, 1461.0, 2697.0, 5481.0, 12244.0, 31608.0, 93060.0, 274296.0, 378082.0, 159066.0, 52464.0, 18937.0, 7994.0, 3827.0, 2065.0, 1119.0, 627.0, 401.0, 254.0, 175.0, 100.0, 74.0, 40.0, 40.0, 30.0, 19.0, 11.0, 9.0, 12.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-32.46875, -31.54736328125, -30.6259765625, -29.70458984375, -28.783203125, -27.86181640625, -26.9404296875, -26.01904296875, -25.09765625, -24.17626953125, -23.2548828125, -22.33349609375, -21.412109375, -20.49072265625, -19.5693359375, -18.64794921875, -17.7265625, -16.80517578125, -15.8837890625, -14.96240234375, -14.041015625, -13.11962890625, -12.1982421875, -11.27685546875, -10.35546875, -9.43408203125, -8.5126953125, -7.59130859375, -6.669921875, -5.74853515625, -4.8271484375, -3.90576171875, -2.984375, -2.06298828125, -1.1416015625, -0.22021484375, 0.701171875, 1.62255859375, 2.5439453125, 3.46533203125, 4.38671875, 5.30810546875, 6.2294921875, 7.15087890625, 8.072265625, 8.99365234375, 9.9150390625, 10.83642578125, 11.7578125, 12.67919921875, 13.6005859375, 14.52197265625, 15.443359375, 16.36474609375, 17.2861328125, 18.20751953125, 19.12890625, 20.05029296875, 20.9716796875, 21.89306640625, 22.814453125, 23.73583984375, 24.6572265625, 25.57861328125, 26.5]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 6.0, 4.0, 9.0, 13.0, 19.0, 12.0, 17.0, 28.0, 37.0, 49.0, 52.0, 52.0, 71.0, 72.0, 54.0, 72.0, 58.0, 74.0, 54.0, 56.0, 40.0, 30.0, 26.0, 21.0, 10.0, 12.0, 15.0, 7.0, 9.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.453125, -13.953857421875, -13.45458984375, -12.955322265625, -12.4560546875, -11.956787109375, -11.45751953125, -10.958251953125, -10.458984375, -9.959716796875, -9.46044921875, -8.961181640625, -8.4619140625, -7.962646484375, -7.46337890625, -6.964111328125, -6.46484375, -5.965576171875, -5.46630859375, -4.967041015625, -4.4677734375, -3.968505859375, -3.46923828125, -2.969970703125, -2.470703125, -1.971435546875, -1.47216796875, -0.972900390625, -0.4736328125, 0.025634765625, 0.52490234375, 1.024169921875, 1.5234375, 2.022705078125, 2.52197265625, 3.021240234375, 3.5205078125, 4.019775390625, 4.51904296875, 5.018310546875, 5.517578125, 6.016845703125, 6.51611328125, 7.015380859375, 7.5146484375, 8.013916015625, 8.51318359375, 9.012451171875, 9.51171875, 10.010986328125, 10.51025390625, 11.009521484375, 11.5087890625, 12.008056640625, 12.50732421875, 13.006591796875, 13.505859375, 14.005126953125, 14.50439453125, 15.003662109375, 15.5029296875, 16.002197265625, 16.50146484375, 17.000732421875, 17.5]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 24.0, 28.0, 44.0, 54.0, 95.0, 134.0, 238.0, 446.0, 907.0, 2235.0, 7070.0, 42982.0, 644672.0, 318690.0, 22775.0, 4834.0, 1691.0, 713.0, 348.0, 194.0, 140.0, 81.0, 48.0, 32.0, 18.0, 12.0, 12.0, 8.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.5, -66.1259765625, -63.751953125, -61.3779296875, -59.00390625, -56.6298828125, -54.255859375, -51.8818359375, -49.5078125, -47.1337890625, -44.759765625, -42.3857421875, -40.01171875, -37.6376953125, -35.263671875, -32.8896484375, -30.515625, -28.1416015625, -25.767578125, -23.3935546875, -21.01953125, -18.6455078125, -16.271484375, -13.8974609375, -11.5234375, -9.1494140625, -6.775390625, -4.4013671875, -2.02734375, 0.3466796875, 2.720703125, 5.0947265625, 7.46875, 9.8427734375, 12.216796875, 14.5908203125, 16.96484375, 19.3388671875, 21.712890625, 24.0869140625, 26.4609375, 28.8349609375, 31.208984375, 33.5830078125, 35.95703125, 38.3310546875, 40.705078125, 43.0791015625, 45.453125, 47.8271484375, 50.201171875, 52.5751953125, 54.94921875, 57.3232421875, 59.697265625, 62.0712890625, 64.4453125, 66.8193359375, 69.193359375, 71.5673828125, 73.94140625, 76.3154296875, 78.689453125, 81.0634765625, 83.4375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 10.0, 7.0, 15.0, 32.0, 52.0, 52.0, 107.0, 96.0, 108.0, 111.0, 104.0, 82.0, 71.0, 51.0, 30.0, 19.0, 12.0, 10.0, 5.0, 5.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-160.875, -156.9453125, -153.015625, -149.0859375, -145.15625, -141.2265625, -137.296875, -133.3671875, -129.4375, -125.5078125, -121.578125, -117.6484375, -113.71875, -109.7890625, -105.859375, -101.9296875, -98.0, -94.0703125, -90.140625, -86.2109375, -82.28125, -78.3515625, -74.421875, -70.4921875, -66.5625, -62.6328125, -58.703125, -54.7734375, -50.84375, -46.9140625, -42.984375, -39.0546875, -35.125, -31.1953125, -27.265625, -23.3359375, -19.40625, -15.4765625, -11.546875, -7.6171875, -3.6875, 0.2421875, 4.171875, 8.1015625, 12.03125, 15.9609375, 19.890625, 23.8203125, 27.75, 31.6796875, 35.609375, 39.5390625, 43.46875, 47.3984375, 51.328125, 55.2578125, 59.1875, 63.1171875, 67.046875, 70.9765625, 74.90625, 78.8359375, 82.765625, 86.6953125, 90.625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 15.0, 8.0, 13.0, 31.0, 34.0, 46.0, 86.0, 155.0, 250.0, 718.0, 3054.0, 52691.0, 965994.0, 22273.0, 2036.0, 520.0, 220.0, 127.0, 73.0, 53.0, 34.0, 32.0, 20.0, 12.0, 9.0, 12.0, 7.0, 6.0, 2.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.4375, -67.529296875, -65.62109375, -63.712890625, -61.8046875, -59.896484375, -57.98828125, -56.080078125, -54.171875, -52.263671875, -50.35546875, -48.447265625, -46.5390625, -44.630859375, -42.72265625, -40.814453125, -38.90625, -36.998046875, -35.08984375, -33.181640625, -31.2734375, -29.365234375, -27.45703125, -25.548828125, -23.640625, -21.732421875, -19.82421875, -17.916015625, -16.0078125, -14.099609375, -12.19140625, -10.283203125, -8.375, -6.466796875, -4.55859375, -2.650390625, -0.7421875, 1.166015625, 3.07421875, 4.982421875, 6.890625, 8.798828125, 10.70703125, 12.615234375, 14.5234375, 16.431640625, 18.33984375, 20.248046875, 22.15625, 24.064453125, 25.97265625, 27.880859375, 29.7890625, 31.697265625, 33.60546875, 35.513671875, 37.421875, 39.330078125, 41.23828125, 43.146484375, 45.0546875, 46.962890625, 48.87109375, 50.779296875, 52.6875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 7.0, 8.0, 17.0, 19.0, 17.0, 40.0, 46.0, 57.0, 109.0, 128.0, 111.0, 121.0, 87.0, 59.0, 46.0, 34.0, 24.0, 19.0, 10.0, 7.0, 6.0, 10.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005672454833984375, -0.005527913570404053, -0.0053833723068237305, -0.005238831043243408, -0.005094289779663086, -0.004949748516082764, -0.004805207252502441, -0.004660665988922119, -0.004516124725341797, -0.004371583461761475, -0.004227042198181152, -0.00408250093460083, -0.003937959671020508, -0.0037934184074401855, -0.0036488771438598633, -0.003504335880279541, -0.0033597946166992188, -0.0032152533531188965, -0.0030707120895385742, -0.002926170825958252, -0.0027816295623779297, -0.0026370882987976074, -0.002492547035217285, -0.002348005771636963, -0.0022034645080566406, -0.0020589232444763184, -0.001914381980895996, -0.0017698407173156738, -0.0016252994537353516, -0.0014807581901550293, -0.001336216926574707, -0.0011916756629943848, -0.0010471343994140625, -0.0009025931358337402, -0.000758051872253418, -0.0006135106086730957, -0.00046896934509277344, -0.00032442808151245117, -0.0001798868179321289, -3.534555435180664e-05, 0.00010919570922851562, 0.0002537369728088379, 0.00039827823638916016, 0.0005428194999694824, 0.0006873607635498047, 0.000831902027130127, 0.0009764432907104492, 0.0011209845542907715, 0.0012655258178710938, 0.001410067081451416, 0.0015546083450317383, 0.0016991496086120605, 0.0018436908721923828, 0.001988232135772705, 0.0021327733993530273, 0.0022773146629333496, 0.002421855926513672, 0.002566397190093994, 0.0027109384536743164, 0.0028554797172546387, 0.003000020980834961, 0.003144562244415283, 0.0032891035079956055, 0.0034336447715759277, 0.00357818603515625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 3.0, 6.0, 7.0, 18.0, 8.0, 17.0, 31.0, 35.0, 65.0, 98.0, 147.0, 292.0, 757.0, 2153.0, 9228.0, 208170.0, 805397.0, 17111.0, 3157.0, 927.0, 384.0, 199.0, 114.0, 77.0, 48.0, 28.0, 17.0, 12.0, 12.0, 11.0, 10.0, 6.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-64.4375, -62.703125, -60.96875, -59.234375, -57.5, -55.765625, -54.03125, -52.296875, -50.5625, -48.828125, -47.09375, -45.359375, -43.625, -41.890625, -40.15625, -38.421875, -36.6875, -34.953125, -33.21875, -31.484375, -29.75, -28.015625, -26.28125, -24.546875, -22.8125, -21.078125, -19.34375, -17.609375, -15.875, -14.140625, -12.40625, -10.671875, -8.9375, -7.203125, -5.46875, -3.734375, -2.0, -0.265625, 1.46875, 3.203125, 4.9375, 6.671875, 8.40625, 10.140625, 11.875, 13.609375, 15.34375, 17.078125, 18.8125, 20.546875, 22.28125, 24.015625, 25.75, 27.484375, 29.21875, 30.953125, 32.6875, 34.421875, 36.15625, 37.890625, 39.625, 41.359375, 43.09375, 44.828125, 46.5625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 6.0, 16.0, 41.0, 108.0, 295.0, 283.0, 151.0, 45.0, 13.0, 9.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.125, -66.3642578125, -63.603515625, -60.8427734375, -58.08203125, -55.3212890625, -52.560546875, -49.7998046875, -47.0390625, -44.2783203125, -41.517578125, -38.7568359375, -35.99609375, -33.2353515625, -30.474609375, -27.7138671875, -24.953125, -22.1923828125, -19.431640625, -16.6708984375, -13.91015625, -11.1494140625, -8.388671875, -5.6279296875, -2.8671875, -0.1064453125, 2.654296875, 5.4150390625, 8.17578125, 10.9365234375, 13.697265625, 16.4580078125, 19.21875, 21.9794921875, 24.740234375, 27.5009765625, 30.26171875, 33.0224609375, 35.783203125, 38.5439453125, 41.3046875, 44.0654296875, 46.826171875, 49.5869140625, 52.34765625, 55.1083984375, 57.869140625, 60.6298828125, 63.390625, 66.1513671875, 68.912109375, 71.6728515625, 74.43359375, 77.1943359375, 79.955078125, 82.7158203125, 85.4765625, 88.2373046875, 90.998046875, 93.7587890625, 96.51953125, 99.2802734375, 102.041015625, 104.8017578125, 107.5625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 12.0, 55.0, 193.0, 422.0, 228.0, 59.0, 17.0, 11.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1013.239013671875, -975.0278930664062, -936.8167724609375, -898.605712890625, -860.3945922851562, -822.1834716796875, -783.9723510742188, -745.76123046875, -707.5501708984375, -669.3390502929688, -631.1279296875, -592.9168701171875, -554.7057495117188, -516.49462890625, -478.28350830078125, -440.0724182128906, -401.86126708984375, -363.650146484375, -325.4390563964844, -287.2279357910156, -249.01683044433594, -210.80572509765625, -172.5946044921875, -134.38351440429688, -96.17239379882812, -57.96128463745117, -19.75017547607422, 18.4609375, 56.67204284667969, 94.88314819335938, 133.09426879882812, 171.30535888671875, 209.5164794921875, 247.7275848388672, 285.9386901855469, 324.1498107910156, 362.36090087890625, 400.572021484375, 438.78314208984375, 476.9942321777344, 515.205322265625, 553.4164428710938, 591.6275634765625, 629.838623046875, 668.0497436523438, 706.2608642578125, 744.4719848632812, 782.68310546875, 820.8942260742188, 859.1053466796875, 897.3164672851562, 935.527587890625, 973.7386474609375, 1011.9497680664062, 1050.160888671875, 1088.3719482421875, 1126.5831298828125, 1164.794189453125, 1203.00537109375, 1241.2164306640625, 1279.4276123046875, 1317.638671875, 1355.849853515625, 1394.0609130859375, 1432.27197265625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 8.0, 8.0, 12.0, 23.0, 22.0, 33.0, 36.0, 40.0, 49.0, 49.0, 59.0, 54.0, 64.0, 65.0, 57.0, 75.0, 64.0, 65.0, 44.0, 36.0, 32.0, 18.0, 23.0, 16.0, 16.0, 9.0, 7.0, 9.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-360.871337890625, -347.7733154296875, -334.6752624511719, -321.5772399902344, -308.47918701171875, -295.38116455078125, -282.28314208984375, -269.1850891113281, -256.0870361328125, -242.98899841308594, -229.89096069335938, -216.79293823242188, -203.69488525390625, -190.59686279296875, -177.4988250732422, -164.40078735351562, -151.30276489257812, -138.20472717285156, -125.106689453125, -112.00865936279297, -98.9106216430664, -85.81258392333984, -72.71455383300781, -59.61651611328125, -46.51847839355469, -33.420440673828125, -20.322406768798828, -7.224372863769531, 5.873664855957031, 18.971702575683594, 32.069732666015625, 45.16777038574219, 58.26580810546875, 71.36384582519531, 84.46188354492188, 97.5599136352539, 110.65795135498047, 123.75598907470703, 136.85401916503906, 149.95205688476562, 163.0500946044922, 176.14813232421875, 189.2461700439453, 202.34420776367188, 215.44223022460938, 228.540283203125, 241.6383056640625, 254.73634338378906, 267.8343811035156, 280.9324035644531, 294.03045654296875, 307.12847900390625, 320.2265319824219, 333.3245544433594, 346.422607421875, 359.5206298828125, 372.61865234375, 385.7166748046875, 398.8147277832031, 411.9127502441406, 425.01080322265625, 438.10882568359375, 451.20684814453125, 464.3049011230469, 477.4029541015625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 5.0, 12.0, 9.0, 14.0, 21.0, 25.0, 59.0, 71.0, 134.0, 253.0, 468.0, 939.0, 1983.0, 4988.0, 14559.0, 59517.0, 1510715.0, 2512189.0, 63711.0, 14776.0, 5111.0, 2255.0, 1004.0, 504.0, 309.0, 211.0, 113.0, 94.0, 56.0, 35.0, 30.0, 28.0, 12.0, 12.0, 12.0, 12.0, 5.0, 7.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-33.875, -32.57373046875, -31.2724609375, -29.97119140625, -28.669921875, -27.36865234375, -26.0673828125, -24.76611328125, -23.46484375, -22.16357421875, -20.8623046875, -19.56103515625, -18.259765625, -16.95849609375, -15.6572265625, -14.35595703125, -13.0546875, -11.75341796875, -10.4521484375, -9.15087890625, -7.849609375, -6.54833984375, -5.2470703125, -3.94580078125, -2.64453125, -1.34326171875, -0.0419921875, 1.25927734375, 2.560546875, 3.86181640625, 5.1630859375, 6.46435546875, 7.765625, 9.06689453125, 10.3681640625, 11.66943359375, 12.970703125, 14.27197265625, 15.5732421875, 16.87451171875, 18.17578125, 19.47705078125, 20.7783203125, 22.07958984375, 23.380859375, 24.68212890625, 25.9833984375, 27.28466796875, 28.5859375, 29.88720703125, 31.1884765625, 32.48974609375, 33.791015625, 35.09228515625, 36.3935546875, 37.69482421875, 38.99609375, 40.29736328125, 41.5986328125, 42.89990234375, 44.201171875, 45.50244140625, 46.8037109375, 48.10498046875, 49.40625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 8.0, 13.0, 23.0, 31.0, 39.0, 64.0, 77.0, 95.0, 87.0, 109.0, 107.0, 83.0, 73.0, 55.0, 45.0, 30.0, 15.0, 14.0, 13.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.401123046875, -16.69287109375, -15.984619140625, -15.2763671875, -14.568115234375, -13.85986328125, -13.151611328125, -12.443359375, -11.735107421875, -11.02685546875, -10.318603515625, -9.6103515625, -8.902099609375, -8.19384765625, -7.485595703125, -6.77734375, -6.069091796875, -5.36083984375, -4.652587890625, -3.9443359375, -3.236083984375, -2.52783203125, -1.819580078125, -1.111328125, -0.403076171875, 0.30517578125, 1.013427734375, 1.7216796875, 2.429931640625, 3.13818359375, 3.846435546875, 4.5546875, 5.262939453125, 5.97119140625, 6.679443359375, 7.3876953125, 8.095947265625, 8.80419921875, 9.512451171875, 10.220703125, 10.928955078125, 11.63720703125, 12.345458984375, 13.0537109375, 13.761962890625, 14.47021484375, 15.178466796875, 15.88671875, 16.594970703125, 17.30322265625, 18.011474609375, 18.7197265625, 19.427978515625, 20.13623046875, 20.844482421875, 21.552734375, 22.260986328125, 22.96923828125, 23.677490234375, 24.3857421875, 25.093994140625, 25.80224609375, 26.510498046875, 27.21875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 7.0, 17.0, 27.0, 27.0, 58.0, 110.0, 256.0, 769.0, 2897.0, 15212.0, 203373.0, 3888631.0, 72513.0, 7815.0, 1627.0, 490.0, 214.0, 79.0, 48.0, 33.0, 13.0, 18.0, 8.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.6875, -60.55078125, -58.4140625, -56.27734375, -54.140625, -52.00390625, -49.8671875, -47.73046875, -45.59375, -43.45703125, -41.3203125, -39.18359375, -37.046875, -34.91015625, -32.7734375, -30.63671875, -28.5, -26.36328125, -24.2265625, -22.08984375, -19.953125, -17.81640625, -15.6796875, -13.54296875, -11.40625, -9.26953125, -7.1328125, -4.99609375, -2.859375, -0.72265625, 1.4140625, 3.55078125, 5.6875, 7.82421875, 9.9609375, 12.09765625, 14.234375, 16.37109375, 18.5078125, 20.64453125, 22.78125, 24.91796875, 27.0546875, 29.19140625, 31.328125, 33.46484375, 35.6015625, 37.73828125, 39.875, 42.01171875, 44.1484375, 46.28515625, 48.421875, 50.55859375, 52.6953125, 54.83203125, 56.96875, 59.10546875, 61.2421875, 63.37890625, 65.515625, 67.65234375, 69.7890625, 71.92578125, 74.0625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 7.0, 9.0, 9.0, 16.0, 20.0, 33.0, 49.0, 73.0, 116.0, 221.0, 788.0, 1696.0, 548.0, 197.0, 104.0, 54.0, 43.0, 24.0, 21.0, 11.0, 10.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.34375, -35.8095703125, -34.275390625, -32.7412109375, -31.20703125, -29.6728515625, -28.138671875, -26.6044921875, -25.0703125, -23.5361328125, -22.001953125, -20.4677734375, -18.93359375, -17.3994140625, -15.865234375, -14.3310546875, -12.796875, -11.2626953125, -9.728515625, -8.1943359375, -6.66015625, -5.1259765625, -3.591796875, -2.0576171875, -0.5234375, 1.0107421875, 2.544921875, 4.0791015625, 5.61328125, 7.1474609375, 8.681640625, 10.2158203125, 11.75, 13.2841796875, 14.818359375, 16.3525390625, 17.88671875, 19.4208984375, 20.955078125, 22.4892578125, 24.0234375, 25.5576171875, 27.091796875, 28.6259765625, 30.16015625, 31.6943359375, 33.228515625, 34.7626953125, 36.296875, 37.8310546875, 39.365234375, 40.8994140625, 42.43359375, 43.9677734375, 45.501953125, 47.0361328125, 48.5703125, 50.1044921875, 51.638671875, 53.1728515625, 54.70703125, 56.2412109375, 57.775390625, 59.3095703125, 60.84375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 13.0, 30.0, 64.0, 148.0, 225.0, 234.0, 148.0, 71.0, 29.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-516.845947265625, -502.1072082519531, -487.36846923828125, -472.6297302246094, -457.8909912109375, -443.1522216796875, -428.41351318359375, -413.67474365234375, -398.9360046386719, -384.197265625, -369.4585266113281, -354.71978759765625, -339.9810485839844, -325.2423095703125, -310.5035400390625, -295.7648010253906, -281.02606201171875, -266.2873229980469, -251.548583984375, -236.80984497070312, -222.0710906982422, -207.3323516845703, -192.59361267089844, -177.8548583984375, -163.11614990234375, -148.37741088867188, -133.638671875, -118.8999252319336, -104.16117858886719, -89.42243957519531, -74.68370056152344, -59.94495391845703, -45.206207275390625, -30.467464447021484, -15.728723526000977, -0.9899826049804688, 13.748760223388672, 28.487503051757812, 43.22624206542969, 57.964988708496094, 72.70372772216797, 87.44246673583984, 102.18121337890625, 116.91995239257812, 131.65869140625, 146.39743041992188, 161.13616943359375, 175.8749237060547, 190.61366271972656, 205.35240173339844, 220.0911407470703, 234.82989501953125, 249.56863403320312, 264.307373046875, 279.0461120605469, 293.78485107421875, 308.5235900878906, 323.2623291015625, 338.0010681152344, 352.73980712890625, 367.4785461425781, 382.21728515625, 396.9560546875, 411.6947937011719, 426.43353271484375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 12.0, 13.0, 18.0, 21.0, 14.0, 19.0, 18.0, 32.0, 49.0, 46.0, 57.0, 58.0, 58.0, 57.0, 70.0, 55.0, 54.0, 48.0, 55.0, 42.0, 39.0, 22.0, 19.0, 27.0, 23.0, 23.0, 12.0, 8.0, 3.0, 9.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-181.0891571044922, -174.58975219726562, -168.09036254882812, -161.59095764160156, -155.091552734375, -148.59214782714844, -142.09274291992188, -135.59335327148438, -129.0939483642578, -122.59454345703125, -116.09514617919922, -109.59574890136719, -103.09634399414062, -96.59693908691406, -90.09754180908203, -83.59814453125, -77.09873962402344, -70.59933471679688, -64.09993743896484, -57.60053634643555, -51.10113525390625, -44.60173416137695, -38.102333068847656, -31.60293197631836, -25.103530883789062, -18.604129791259766, -12.104728698730469, -5.605327606201172, 0.894073486328125, 7.393474578857422, 13.892875671386719, 20.392276763916016, 26.891677856445312, 33.39107894897461, 39.890480041503906, 46.3898811340332, 52.8892822265625, 59.3886833190918, 65.8880844116211, 72.38748168945312, 78.88688659667969, 85.38629150390625, 91.88568878173828, 98.38508605957031, 104.88449096679688, 111.38389587402344, 117.88329315185547, 124.3826904296875, 130.88209533691406, 137.38150024414062, 143.88088989257812, 150.3802947998047, 156.87969970703125, 163.3791046142578, 169.87850952148438, 176.37789916992188, 182.87730407714844, 189.376708984375, 195.8760986328125, 202.37550354003906, 208.87490844726562, 215.3743133544922, 221.87371826171875, 228.37310791015625, 234.8725128173828]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 14.0, 23.0, 24.0, 61.0, 116.0, 218.0, 430.0, 960.0, 2981.0, 12846.0, 94869.0, 684943.0, 219060.0, 24627.0, 4784.0, 1365.0, 576.0, 264.0, 142.0, 69.0, 49.0, 38.0, 29.0, 16.0, 7.0, 8.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.71875, -49.70458984375, -47.6904296875, -45.67626953125, -43.662109375, -41.64794921875, -39.6337890625, -37.61962890625, -35.60546875, -33.59130859375, -31.5771484375, -29.56298828125, -27.548828125, -25.53466796875, -23.5205078125, -21.50634765625, -19.4921875, -17.47802734375, -15.4638671875, -13.44970703125, -11.435546875, -9.42138671875, -7.4072265625, -5.39306640625, -3.37890625, -1.36474609375, 0.6494140625, 2.66357421875, 4.677734375, 6.69189453125, 8.7060546875, 10.72021484375, 12.734375, 14.74853515625, 16.7626953125, 18.77685546875, 20.791015625, 22.80517578125, 24.8193359375, 26.83349609375, 28.84765625, 30.86181640625, 32.8759765625, 34.89013671875, 36.904296875, 38.91845703125, 40.9326171875, 42.94677734375, 44.9609375, 46.97509765625, 48.9892578125, 51.00341796875, 53.017578125, 55.03173828125, 57.0458984375, 59.06005859375, 61.07421875, 63.08837890625, 65.1025390625, 67.11669921875, 69.130859375, 71.14501953125, 73.1591796875, 75.17333984375, 77.1875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 7.0, 12.0, 21.0, 30.0, 36.0, 48.0, 78.0, 90.0, 95.0, 110.0, 112.0, 91.0, 69.0, 58.0, 47.0, 32.0, 28.0, 16.0, 13.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.03125, -17.303466796875, -16.57568359375, -15.847900390625, -15.1201171875, -14.392333984375, -13.66455078125, -12.936767578125, -12.208984375, -11.481201171875, -10.75341796875, -10.025634765625, -9.2978515625, -8.570068359375, -7.84228515625, -7.114501953125, -6.38671875, -5.658935546875, -4.93115234375, -4.203369140625, -3.4755859375, -2.747802734375, -2.02001953125, -1.292236328125, -0.564453125, 0.163330078125, 0.89111328125, 1.618896484375, 2.3466796875, 3.074462890625, 3.80224609375, 4.530029296875, 5.2578125, 5.985595703125, 6.71337890625, 7.441162109375, 8.1689453125, 8.896728515625, 9.62451171875, 10.352294921875, 11.080078125, 11.807861328125, 12.53564453125, 13.263427734375, 13.9912109375, 14.718994140625, 15.44677734375, 16.174560546875, 16.90234375, 17.630126953125, 18.35791015625, 19.085693359375, 19.8134765625, 20.541259765625, 21.26904296875, 21.996826171875, 22.724609375, 23.452392578125, 24.18017578125, 24.907958984375, 25.6357421875, 26.363525390625, 27.09130859375, 27.819091796875, 28.546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 5.0, 7.0, 6.0, 8.0, 19.0, 15.0, 25.0, 26.0, 35.0, 57.0, 90.0, 113.0, 175.0, 345.0, 569.0, 1211.0, 2847.0, 9073.0, 55011.0, 780151.0, 173707.0, 16713.0, 4652.0, 1769.0, 833.0, 393.0, 220.0, 142.0, 84.0, 69.0, 47.0, 28.0, 16.0, 23.0, 9.0, 19.0, 5.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-88.625, -86.0712890625, -83.517578125, -80.9638671875, -78.41015625, -75.8564453125, -73.302734375, -70.7490234375, -68.1953125, -65.6416015625, -63.087890625, -60.5341796875, -57.98046875, -55.4267578125, -52.873046875, -50.3193359375, -47.765625, -45.2119140625, -42.658203125, -40.1044921875, -37.55078125, -34.9970703125, -32.443359375, -29.8896484375, -27.3359375, -24.7822265625, -22.228515625, -19.6748046875, -17.12109375, -14.5673828125, -12.013671875, -9.4599609375, -6.90625, -4.3525390625, -1.798828125, 0.7548828125, 3.30859375, 5.8623046875, 8.416015625, 10.9697265625, 13.5234375, 16.0771484375, 18.630859375, 21.1845703125, 23.73828125, 26.2919921875, 28.845703125, 31.3994140625, 33.953125, 36.5068359375, 39.060546875, 41.6142578125, 44.16796875, 46.7216796875, 49.275390625, 51.8291015625, 54.3828125, 56.9365234375, 59.490234375, 62.0439453125, 64.59765625, 67.1513671875, 69.705078125, 72.2587890625, 74.8125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 15.0, 18.0, 23.0, 29.0, 44.0, 61.0, 72.0, 86.0, 103.0, 106.0, 102.0, 75.0, 70.0, 44.0, 36.0, 27.0, 16.0, 7.0, 12.0, 9.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-132.25, -128.4482421875, -124.646484375, -120.8447265625, -117.04296875, -113.2412109375, -109.439453125, -105.6376953125, -101.8359375, -98.0341796875, -94.232421875, -90.4306640625, -86.62890625, -82.8271484375, -79.025390625, -75.2236328125, -71.421875, -67.6201171875, -63.818359375, -60.0166015625, -56.21484375, -52.4130859375, -48.611328125, -44.8095703125, -41.0078125, -37.2060546875, -33.404296875, -29.6025390625, -25.80078125, -21.9990234375, -18.197265625, -14.3955078125, -10.59375, -6.7919921875, -2.990234375, 0.8115234375, 4.61328125, 8.4150390625, 12.216796875, 16.0185546875, 19.8203125, 23.6220703125, 27.423828125, 31.2255859375, 35.02734375, 38.8291015625, 42.630859375, 46.4326171875, 50.234375, 54.0361328125, 57.837890625, 61.6396484375, 65.44140625, 69.2431640625, 73.044921875, 76.8466796875, 80.6484375, 84.4501953125, 88.251953125, 92.0537109375, 95.85546875, 99.6572265625, 103.458984375, 107.2607421875, 111.0625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 3.0, 4.0, 16.0, 8.0, 9.0, 16.0, 15.0, 32.0, 52.0, 58.0, 108.0, 165.0, 276.0, 527.0, 1123.0, 3258.0, 14764.0, 209009.0, 776881.0, 33488.0, 5476.0, 1654.0, 693.0, 333.0, 185.0, 121.0, 82.0, 59.0, 33.0, 19.0, 20.0, 13.0, 16.0, 6.0, 5.0, 11.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.65625, -31.609375, -30.5625, -29.515625, -28.46875, -27.421875, -26.375, -25.328125, -24.28125, -23.234375, -22.1875, -21.140625, -20.09375, -19.046875, -18.0, -16.953125, -15.90625, -14.859375, -13.8125, -12.765625, -11.71875, -10.671875, -9.625, -8.578125, -7.53125, -6.484375, -5.4375, -4.390625, -3.34375, -2.296875, -1.25, -0.203125, 0.84375, 1.890625, 2.9375, 3.984375, 5.03125, 6.078125, 7.125, 8.171875, 9.21875, 10.265625, 11.3125, 12.359375, 13.40625, 14.453125, 15.5, 16.546875, 17.59375, 18.640625, 19.6875, 20.734375, 21.78125, 22.828125, 23.875, 24.921875, 25.96875, 27.015625, 28.0625, 29.109375, 30.15625, 31.203125, 32.25, 33.296875, 34.34375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 12.0, 9.0, 17.0, 12.0, 22.0, 37.0, 45.0, 50.0, 79.0, 141.0, 164.0, 135.0, 76.0, 56.0, 33.0, 27.0, 16.0, 13.0, 9.0, 11.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00557708740234375, -0.0054357051849365234, -0.005294322967529297, -0.00515294075012207, -0.005011558532714844, -0.004870176315307617, -0.004728794097900391, -0.004587411880493164, -0.0044460296630859375, -0.004304647445678711, -0.004163265228271484, -0.004021883010864258, -0.0038805007934570312, -0.0037391185760498047, -0.003597736358642578, -0.0034563541412353516, -0.003314971923828125, -0.0031735897064208984, -0.003032207489013672, -0.0028908252716064453, -0.0027494430541992188, -0.002608060836791992, -0.0024666786193847656, -0.002325296401977539, -0.0021839141845703125, -0.002042531967163086, -0.0019011497497558594, -0.0017597675323486328, -0.0016183853149414062, -0.0014770030975341797, -0.0013356208801269531, -0.0011942386627197266, -0.0010528564453125, -0.0009114742279052734, -0.0007700920104980469, -0.0006287097930908203, -0.00048732757568359375, -0.0003459453582763672, -0.00020456314086914062, -6.318092346191406e-05, 7.82012939453125e-05, 0.00021958351135253906, 0.0003609657287597656, 0.0005023479461669922, 0.0006437301635742188, 0.0007851123809814453, 0.0009264945983886719, 0.0010678768157958984, 0.001209259033203125, 0.0013506412506103516, 0.0014920234680175781, 0.0016334056854248047, 0.0017747879028320312, 0.0019161701202392578, 0.0020575523376464844, 0.002198934555053711, 0.0023403167724609375, 0.002481698989868164, 0.0026230812072753906, 0.002764463424682617, 0.0029058456420898438, 0.0030472278594970703, 0.003188610076904297, 0.0033299922943115234, 0.00347137451171875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 11.0, 12.0, 16.0, 34.0, 29.0, 49.0, 57.0, 84.0, 121.0, 216.0, 391.0, 825.0, 1882.0, 5529.0, 25349.0, 370559.0, 600827.0, 31973.0, 6455.0, 2110.0, 842.0, 449.0, 248.0, 148.0, 88.0, 59.0, 53.0, 34.0, 20.0, 23.0, 12.0, 10.0, 9.0, 2.0, 7.0, 2.0, 1.0, 5.0, 3.0, 0.0, 4.0], "bins": [-36.09375, -35.169677734375, -34.24560546875, -33.321533203125, -32.3974609375, -31.473388671875, -30.54931640625, -29.625244140625, -28.701171875, -27.777099609375, -26.85302734375, -25.928955078125, -25.0048828125, -24.080810546875, -23.15673828125, -22.232666015625, -21.30859375, -20.384521484375, -19.46044921875, -18.536376953125, -17.6123046875, -16.688232421875, -15.76416015625, -14.840087890625, -13.916015625, -12.991943359375, -12.06787109375, -11.143798828125, -10.2197265625, -9.295654296875, -8.37158203125, -7.447509765625, -6.5234375, -5.599365234375, -4.67529296875, -3.751220703125, -2.8271484375, -1.903076171875, -0.97900390625, -0.054931640625, 0.869140625, 1.793212890625, 2.71728515625, 3.641357421875, 4.5654296875, 5.489501953125, 6.41357421875, 7.337646484375, 8.26171875, 9.185791015625, 10.10986328125, 11.033935546875, 11.9580078125, 12.882080078125, 13.80615234375, 14.730224609375, 15.654296875, 16.578369140625, 17.50244140625, 18.426513671875, 19.3505859375, 20.274658203125, 21.19873046875, 22.122802734375, 23.046875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 7.0, 11.0, 29.0, 34.0, 46.0, 68.0, 124.0, 138.0, 190.0, 119.0, 63.0, 51.0, 31.0, 22.0, 14.0, 8.0, 5.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.09375, -37.87451171875, -36.6552734375, -35.43603515625, -34.216796875, -32.99755859375, -31.7783203125, -30.55908203125, -29.33984375, -28.12060546875, -26.9013671875, -25.68212890625, -24.462890625, -23.24365234375, -22.0244140625, -20.80517578125, -19.5859375, -18.36669921875, -17.1474609375, -15.92822265625, -14.708984375, -13.48974609375, -12.2705078125, -11.05126953125, -9.83203125, -8.61279296875, -7.3935546875, -6.17431640625, -4.955078125, -3.73583984375, -2.5166015625, -1.29736328125, -0.078125, 1.14111328125, 2.3603515625, 3.57958984375, 4.798828125, 6.01806640625, 7.2373046875, 8.45654296875, 9.67578125, 10.89501953125, 12.1142578125, 13.33349609375, 14.552734375, 15.77197265625, 16.9912109375, 18.21044921875, 19.4296875, 20.64892578125, 21.8681640625, 23.08740234375, 24.306640625, 25.52587890625, 26.7451171875, 27.96435546875, 29.18359375, 30.40283203125, 31.6220703125, 32.84130859375, 34.060546875, 35.27978515625, 36.4990234375, 37.71826171875, 38.9375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 12.0, 25.0, 73.0, 153.0, 257.0, 233.0, 131.0, 52.0, 33.0, 9.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-403.8166809082031, -384.4425964355469, -365.0684814453125, -345.69439697265625, -326.3203125, -306.9461975097656, -287.5721130371094, -268.197998046875, -248.82391357421875, -229.44981384277344, -210.07571411132812, -190.70162963867188, -171.32752990722656, -151.95343017578125, -132.579345703125, -113.20524597167969, -93.83114624023438, -74.45704650878906, -55.08295440673828, -35.708858489990234, -16.334762573242188, 3.039337158203125, 22.413429260253906, 41.78752136230469, 61.16162109375, 80.53572082519531, 99.9098129272461, 119.28390502929688, 138.6580047607422, 158.0321044921875, 177.40618896484375, 196.78028869628906, 216.1544189453125, 235.5285186767578, 254.90261840820312, 274.2767028808594, 293.65081787109375, 313.02490234375, 332.39898681640625, 351.7730712890625, 371.1471862792969, 390.5212707519531, 409.8953857421875, 429.26947021484375, 448.6435546875, 468.0176696777344, 487.3917541503906, 506.765869140625, 526.1399536132812, 545.5140380859375, 564.8881225585938, 584.2622680664062, 603.6363525390625, 623.0104370117188, 642.384521484375, 661.7586059570312, 681.1326904296875, 700.5067749023438, 719.880859375, 739.2550048828125, 758.6290893554688, 778.003173828125, 797.3772583007812, 816.7513427734375, 836.12548828125]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 2.0, 5.0, 6.0, 7.0, 12.0, 10.0, 15.0, 19.0, 16.0, 27.0, 24.0, 29.0, 35.0, 38.0, 46.0, 36.0, 51.0, 39.0, 52.0, 63.0, 48.0, 43.0, 53.0, 39.0, 33.0, 41.0, 27.0, 23.0, 24.0, 14.0, 19.0, 19.0, 8.0, 10.0, 12.0, 12.0, 12.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-240.06988525390625, -232.47193908691406, -224.87399291992188, -217.27603149414062, -209.67808532714844, -202.08013916015625, -194.48219299316406, -186.88424682617188, -179.28628540039062, -171.68833923339844, -164.09039306640625, -156.492431640625, -148.8944854736328, -141.29653930664062, -133.69859313964844, -126.10064697265625, -118.50270080566406, -110.90475463867188, -103.30680084228516, -95.70885467529297, -88.11090087890625, -80.51295471191406, -72.91500854492188, -65.31706237792969, -57.71910858154297, -50.121158599853516, -42.52320861816406, -34.925262451171875, -27.327312469482422, -19.72936248779297, -12.131416320800781, -4.533466339111328, 3.0644683837890625, 10.6624174118042, 18.260366439819336, 25.858314514160156, 33.45626449584961, 41.05421447753906, 48.65216064453125, 56.2501106262207, 63.848060607910156, 71.44600677490234, 79.04396057128906, 86.64190673828125, 94.23985290527344, 101.83780670166016, 109.43575286865234, 117.03370666503906, 124.63165283203125, 132.22959899902344, 139.82754516601562, 147.42550659179688, 155.02345275878906, 162.62139892578125, 170.21934509277344, 177.81729125976562, 185.41525268554688, 193.01319885253906, 200.61114501953125, 208.2091064453125, 215.8070526123047, 223.40499877929688, 231.00294494628906, 238.60089111328125, 246.19883728027344]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 5.0, 13.0, 11.0, 13.0, 29.0, 45.0, 73.0, 149.0, 298.0, 741.0, 2058.0, 7707.0, 45891.0, 2964105.0, 1133306.0, 30931.0, 5684.0, 1769.0, 679.0, 278.0, 170.0, 105.0, 67.0, 38.0, 28.0, 17.0, 13.0, 14.0, 7.0, 5.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-53.375, -51.88916015625, -50.4033203125, -48.91748046875, -47.431640625, -45.94580078125, -44.4599609375, -42.97412109375, -41.48828125, -40.00244140625, -38.5166015625, -37.03076171875, -35.544921875, -34.05908203125, -32.5732421875, -31.08740234375, -29.6015625, -28.11572265625, -26.6298828125, -25.14404296875, -23.658203125, -22.17236328125, -20.6865234375, -19.20068359375, -17.71484375, -16.22900390625, -14.7431640625, -13.25732421875, -11.771484375, -10.28564453125, -8.7998046875, -7.31396484375, -5.828125, -4.34228515625, -2.8564453125, -1.37060546875, 0.115234375, 1.60107421875, 3.0869140625, 4.57275390625, 6.05859375, 7.54443359375, 9.0302734375, 10.51611328125, 12.001953125, 13.48779296875, 14.9736328125, 16.45947265625, 17.9453125, 19.43115234375, 20.9169921875, 22.40283203125, 23.888671875, 25.37451171875, 26.8603515625, 28.34619140625, 29.83203125, 31.31787109375, 32.8037109375, 34.28955078125, 35.775390625, 37.26123046875, 38.7470703125, 40.23291015625, 41.71875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 11.0, 16.0, 22.0, 37.0, 56.0, 76.0, 101.0, 126.0, 151.0, 128.0, 79.0, 64.0, 58.0, 35.0, 16.0, 15.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.984375, -20.126708984375, -19.26904296875, -18.411376953125, -17.5537109375, -16.696044921875, -15.83837890625, -14.980712890625, -14.123046875, -13.265380859375, -12.40771484375, -11.550048828125, -10.6923828125, -9.834716796875, -8.97705078125, -8.119384765625, -7.26171875, -6.404052734375, -5.54638671875, -4.688720703125, -3.8310546875, -2.973388671875, -2.11572265625, -1.258056640625, -0.400390625, 0.457275390625, 1.31494140625, 2.172607421875, 3.0302734375, 3.887939453125, 4.74560546875, 5.603271484375, 6.4609375, 7.318603515625, 8.17626953125, 9.033935546875, 9.8916015625, 10.749267578125, 11.60693359375, 12.464599609375, 13.322265625, 14.179931640625, 15.03759765625, 15.895263671875, 16.7529296875, 17.610595703125, 18.46826171875, 19.325927734375, 20.18359375, 21.041259765625, 21.89892578125, 22.756591796875, 23.6142578125, 24.471923828125, 25.32958984375, 26.187255859375, 27.044921875, 27.902587890625, 28.76025390625, 29.617919921875, 30.4755859375, 31.333251953125, 32.19091796875, 33.048583984375, 33.90625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 11.0, 9.0, 29.0, 37.0, 60.0, 104.0, 188.0, 400.0, 832.0, 1941.0, 4679.0, 13595.0, 48952.0, 337418.0, 3469189.0, 256771.0, 41132.0, 11815.0, 4108.0, 1616.0, 704.0, 327.0, 156.0, 83.0, 35.0, 24.0, 24.0, 9.0, 7.0, 7.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.58935546875, -30.5849609375, -29.58056640625, -28.576171875, -27.57177734375, -26.5673828125, -25.56298828125, -24.55859375, -23.55419921875, -22.5498046875, -21.54541015625, -20.541015625, -19.53662109375, -18.5322265625, -17.52783203125, -16.5234375, -15.51904296875, -14.5146484375, -13.51025390625, -12.505859375, -11.50146484375, -10.4970703125, -9.49267578125, -8.48828125, -7.48388671875, -6.4794921875, -5.47509765625, -4.470703125, -3.46630859375, -2.4619140625, -1.45751953125, -0.453125, 0.55126953125, 1.5556640625, 2.56005859375, 3.564453125, 4.56884765625, 5.5732421875, 6.57763671875, 7.58203125, 8.58642578125, 9.5908203125, 10.59521484375, 11.599609375, 12.60400390625, 13.6083984375, 14.61279296875, 15.6171875, 16.62158203125, 17.6259765625, 18.63037109375, 19.634765625, 20.63916015625, 21.6435546875, 22.64794921875, 23.65234375, 24.65673828125, 25.6611328125, 26.66552734375, 27.669921875, 28.67431640625, 29.6787109375, 30.68310546875, 31.6875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 5.0, 9.0, 8.0, 10.0, 11.0, 15.0, 17.0, 21.0, 48.0, 45.0, 83.0, 121.0, 178.0, 382.0, 757.0, 1037.0, 579.0, 285.0, 149.0, 95.0, 52.0, 44.0, 29.0, 17.0, 16.0, 12.0, 11.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.53125, -31.58154296875, -30.6318359375, -29.68212890625, -28.732421875, -27.78271484375, -26.8330078125, -25.88330078125, -24.93359375, -23.98388671875, -23.0341796875, -22.08447265625, -21.134765625, -20.18505859375, -19.2353515625, -18.28564453125, -17.3359375, -16.38623046875, -15.4365234375, -14.48681640625, -13.537109375, -12.58740234375, -11.6376953125, -10.68798828125, -9.73828125, -8.78857421875, -7.8388671875, -6.88916015625, -5.939453125, -4.98974609375, -4.0400390625, -3.09033203125, -2.140625, -1.19091796875, -0.2412109375, 0.70849609375, 1.658203125, 2.60791015625, 3.5576171875, 4.50732421875, 5.45703125, 6.40673828125, 7.3564453125, 8.30615234375, 9.255859375, 10.20556640625, 11.1552734375, 12.10498046875, 13.0546875, 14.00439453125, 14.9541015625, 15.90380859375, 16.853515625, 17.80322265625, 18.7529296875, 19.70263671875, 20.65234375, 21.60205078125, 22.5517578125, 23.50146484375, 24.451171875, 25.40087890625, 26.3505859375, 27.30029296875, 28.25]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 14.0, 23.0, 45.0, 103.0, 191.0, 224.0, 190.0, 100.0, 44.0, 21.0, 16.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-464.05780029296875, -453.45294189453125, -442.84808349609375, -432.24322509765625, -421.63836669921875, -411.03350830078125, -400.42864990234375, -389.82379150390625, -379.21893310546875, -368.61407470703125, -358.00921630859375, -347.40435791015625, -336.79949951171875, -326.19464111328125, -315.58978271484375, -304.98492431640625, -294.38006591796875, -283.77520751953125, -273.17034912109375, -262.56549072265625, -251.96063232421875, -241.35577392578125, -230.75091552734375, -220.14605712890625, -209.54119873046875, -198.93634033203125, -188.33148193359375, -177.72662353515625, -167.12176513671875, -156.51690673828125, -145.91204833984375, -135.30718994140625, -124.70230102539062, -114.09744262695312, -103.49258422851562, -92.88772583007812, -82.28286743164062, -71.67800903320312, -61.073150634765625, -50.468292236328125, -39.863433837890625, -29.258575439453125, -18.653717041015625, -8.048858642578125, 2.555999755859375, 13.160858154296875, 23.765716552734375, 34.370574951171875, 44.975433349609375, 55.580291748046875, 66.18515014648438, 76.79000854492188, 87.39486694335938, 97.99972534179688, 108.60458374023438, 119.20944213867188, 129.81430053710938, 140.41915893554688, 151.02401733398438, 161.62887573242188, 172.23373413085938, 182.83859252929688, 193.44345092773438, 204.04830932617188, 214.65316772460938]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 7.0, 5.0, 12.0, 12.0, 15.0, 23.0, 14.0, 20.0, 24.0, 26.0, 28.0, 37.0, 44.0, 36.0, 47.0, 32.0, 50.0, 50.0, 44.0, 43.0, 64.0, 45.0, 54.0, 26.0, 35.0, 35.0, 27.0, 24.0, 23.0, 14.0, 11.0, 16.0, 14.0, 9.0, 9.0, 2.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-153.9849090576172, -149.89161682128906, -145.79830932617188, -141.70501708984375, -137.61172485351562, -133.5184326171875, -129.42514038085938, -125.33183288574219, -121.23854064941406, -117.14524841308594, -113.05194854736328, -108.95864868164062, -104.8653564453125, -100.77206420898438, -96.67876434326172, -92.58546447753906, -88.49217224121094, -84.39888000488281, -80.30558013916016, -76.2122802734375, -72.11898803710938, -68.02569580078125, -63.932395935058594, -59.8390998840332, -55.74580383300781, -51.65250778198242, -47.55921173095703, -43.46591567993164, -39.37261962890625, -35.27932357788086, -31.18602752685547, -27.092731475830078, -22.99945068359375, -18.90615463256836, -14.812858581542969, -10.719562530517578, -6.6262664794921875, -2.532970428466797, 1.5603256225585938, 5.653621673583984, 9.746917724609375, 13.840213775634766, 17.933509826660156, 22.026805877685547, 26.120101928710938, 30.213397979736328, 34.30669403076172, 38.39999008178711, 42.4932861328125, 46.58658218383789, 50.67987823486328, 54.77317428588867, 58.86647033691406, 62.95976638793945, 67.05306243896484, 71.1463623046875, 75.23965454101562, 79.33294677734375, 83.4262466430664, 87.51954650878906, 91.61283874511719, 95.70613098144531, 99.79943084716797, 103.89273071289062, 107.98602294921875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 4.0, 8.0, 2.0, 13.0, 17.0, 25.0, 33.0, 57.0, 129.0, 206.0, 425.0, 895.0, 2313.0, 7286.0, 30059.0, 159980.0, 598871.0, 198854.0, 36223.0, 8637.0, 2601.0, 958.0, 409.0, 231.0, 130.0, 57.0, 36.0, 36.0, 16.0, 13.0, 12.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.0625, -39.67333984375, -38.2841796875, -36.89501953125, -35.505859375, -34.11669921875, -32.7275390625, -31.33837890625, -29.94921875, -28.56005859375, -27.1708984375, -25.78173828125, -24.392578125, -23.00341796875, -21.6142578125, -20.22509765625, -18.8359375, -17.44677734375, -16.0576171875, -14.66845703125, -13.279296875, -11.89013671875, -10.5009765625, -9.11181640625, -7.72265625, -6.33349609375, -4.9443359375, -3.55517578125, -2.166015625, -0.77685546875, 0.6123046875, 2.00146484375, 3.390625, 4.77978515625, 6.1689453125, 7.55810546875, 8.947265625, 10.33642578125, 11.7255859375, 13.11474609375, 14.50390625, 15.89306640625, 17.2822265625, 18.67138671875, 20.060546875, 21.44970703125, 22.8388671875, 24.22802734375, 25.6171875, 27.00634765625, 28.3955078125, 29.78466796875, 31.173828125, 32.56298828125, 33.9521484375, 35.34130859375, 36.73046875, 38.11962890625, 39.5087890625, 40.89794921875, 42.287109375, 43.67626953125, 45.0654296875, 46.45458984375, 47.84375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 14.0, 21.0, 21.0, 37.0, 71.0, 80.0, 120.0, 121.0, 122.0, 109.0, 73.0, 71.0, 50.0, 28.0, 21.0, 24.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5625, -18.720703125, -17.87890625, -17.037109375, -16.1953125, -15.353515625, -14.51171875, -13.669921875, -12.828125, -11.986328125, -11.14453125, -10.302734375, -9.4609375, -8.619140625, -7.77734375, -6.935546875, -6.09375, -5.251953125, -4.41015625, -3.568359375, -2.7265625, -1.884765625, -1.04296875, -0.201171875, 0.640625, 1.482421875, 2.32421875, 3.166015625, 4.0078125, 4.849609375, 5.69140625, 6.533203125, 7.375, 8.216796875, 9.05859375, 9.900390625, 10.7421875, 11.583984375, 12.42578125, 13.267578125, 14.109375, 14.951171875, 15.79296875, 16.634765625, 17.4765625, 18.318359375, 19.16015625, 20.001953125, 20.84375, 21.685546875, 22.52734375, 23.369140625, 24.2109375, 25.052734375, 25.89453125, 26.736328125, 27.578125, 28.419921875, 29.26171875, 30.103515625, 30.9453125, 31.787109375, 32.62890625, 33.470703125, 34.3125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 11.0, 14.0, 12.0, 21.0, 41.0, 44.0, 108.0, 202.0, 460.0, 1103.0, 3288.0, 16234.0, 208531.0, 757390.0, 51575.0, 6427.0, 1736.0, 718.0, 302.0, 146.0, 83.0, 35.0, 27.0, 20.0, 10.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.25, -71.8740234375, -69.498046875, -67.1220703125, -64.74609375, -62.3701171875, -59.994140625, -57.6181640625, -55.2421875, -52.8662109375, -50.490234375, -48.1142578125, -45.73828125, -43.3623046875, -40.986328125, -38.6103515625, -36.234375, -33.8583984375, -31.482421875, -29.1064453125, -26.73046875, -24.3544921875, -21.978515625, -19.6025390625, -17.2265625, -14.8505859375, -12.474609375, -10.0986328125, -7.72265625, -5.3466796875, -2.970703125, -0.5947265625, 1.78125, 4.1572265625, 6.533203125, 8.9091796875, 11.28515625, 13.6611328125, 16.037109375, 18.4130859375, 20.7890625, 23.1650390625, 25.541015625, 27.9169921875, 30.29296875, 32.6689453125, 35.044921875, 37.4208984375, 39.796875, 42.1728515625, 44.548828125, 46.9248046875, 49.30078125, 51.6767578125, 54.052734375, 56.4287109375, 58.8046875, 61.1806640625, 63.556640625, 65.9326171875, 68.30859375, 70.6845703125, 73.060546875, 75.4365234375, 77.8125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 14.0, 11.0, 11.0, 18.0, 32.0, 33.0, 46.0, 48.0, 57.0, 68.0, 74.0, 66.0, 69.0, 62.0, 65.0, 76.0, 54.0, 42.0, 43.0, 28.0, 15.0, 22.0, 17.0, 13.0, 7.0, 7.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-101.375, -99.0302734375, -96.685546875, -94.3408203125, -91.99609375, -89.6513671875, -87.306640625, -84.9619140625, -82.6171875, -80.2724609375, -77.927734375, -75.5830078125, -73.23828125, -70.8935546875, -68.548828125, -66.2041015625, -63.859375, -61.5146484375, -59.169921875, -56.8251953125, -54.48046875, -52.1357421875, -49.791015625, -47.4462890625, -45.1015625, -42.7568359375, -40.412109375, -38.0673828125, -35.72265625, -33.3779296875, -31.033203125, -28.6884765625, -26.34375, -23.9990234375, -21.654296875, -19.3095703125, -16.96484375, -14.6201171875, -12.275390625, -9.9306640625, -7.5859375, -5.2412109375, -2.896484375, -0.5517578125, 1.79296875, 4.1376953125, 6.482421875, 8.8271484375, 11.171875, 13.5166015625, 15.861328125, 18.2060546875, 20.55078125, 22.8955078125, 25.240234375, 27.5849609375, 29.9296875, 32.2744140625, 34.619140625, 36.9638671875, 39.30859375, 41.6533203125, 43.998046875, 46.3427734375, 48.6875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 10.0, 6.0, 13.0, 21.0, 35.0, 58.0, 127.0, 337.0, 1030.0, 5808.0, 101480.0, 887227.0, 47342.0, 3792.0, 772.0, 246.0, 102.0, 60.0, 28.0, 21.0, 17.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.359375, -27.360595703125, -26.36181640625, -25.363037109375, -24.3642578125, -23.365478515625, -22.36669921875, -21.367919921875, -20.369140625, -19.370361328125, -18.37158203125, -17.372802734375, -16.3740234375, -15.375244140625, -14.37646484375, -13.377685546875, -12.37890625, -11.380126953125, -10.38134765625, -9.382568359375, -8.3837890625, -7.385009765625, -6.38623046875, -5.387451171875, -4.388671875, -3.389892578125, -2.39111328125, -1.392333984375, -0.3935546875, 0.605224609375, 1.60400390625, 2.602783203125, 3.6015625, 4.600341796875, 5.59912109375, 6.597900390625, 7.5966796875, 8.595458984375, 9.59423828125, 10.593017578125, 11.591796875, 12.590576171875, 13.58935546875, 14.588134765625, 15.5869140625, 16.585693359375, 17.58447265625, 18.583251953125, 19.58203125, 20.580810546875, 21.57958984375, 22.578369140625, 23.5771484375, 24.575927734375, 25.57470703125, 26.573486328125, 27.572265625, 28.571044921875, 29.56982421875, 30.568603515625, 31.5673828125, 32.566162109375, 33.56494140625, 34.563720703125, 35.5625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 2.0, 9.0, 11.0, 15.0, 11.0, 13.0, 11.0, 32.0, 31.0, 48.0, 53.0, 50.0, 78.0, 79.0, 91.0, 81.0, 68.0, 53.0, 44.0, 37.0, 26.0, 27.0, 23.0, 17.0, 11.0, 16.0, 9.0, 13.0, 9.0, 5.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0029621124267578125, -0.002879112958908081, -0.0027961134910583496, -0.002713114023208618, -0.0026301145553588867, -0.0025471150875091553, -0.002464115619659424, -0.0023811161518096924, -0.002298116683959961, -0.0022151172161102295, -0.002132117748260498, -0.0020491182804107666, -0.001966118812561035, -0.0018831193447113037, -0.0018001198768615723, -0.0017171204090118408, -0.0016341209411621094, -0.001551121473312378, -0.0014681220054626465, -0.001385122537612915, -0.0013021230697631836, -0.0012191236019134521, -0.0011361241340637207, -0.0010531246662139893, -0.0009701251983642578, -0.0008871257305145264, -0.0008041262626647949, -0.0007211267948150635, -0.000638127326965332, -0.0005551278591156006, -0.00047212839126586914, -0.0003891289234161377, -0.00030612945556640625, -0.0002231299877166748, -0.00014013051986694336, -5.7131052017211914e-05, 2.586841583251953e-05, 0.00010886788368225098, 0.00019186735153198242, 0.00027486681938171387, 0.0003578662872314453, 0.00044086575508117676, 0.0005238652229309082, 0.0006068646907806396, 0.0006898641586303711, 0.0007728636264801025, 0.000855863094329834, 0.0009388625621795654, 0.0010218620300292969, 0.0011048614978790283, 0.0011878609657287598, 0.0012708604335784912, 0.0013538599014282227, 0.001436859369277954, 0.0015198588371276855, 0.001602858304977417, 0.0016858577728271484, 0.0017688572406768799, 0.0018518567085266113, 0.0019348561763763428, 0.0020178556442260742, 0.0021008551120758057, 0.002183854579925537, 0.0022668540477752686, 0.002349853515625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 17.0, 10.0, 17.0, 34.0, 59.0, 113.0, 179.0, 317.0, 629.0, 1488.0, 4237.0, 17522.0, 149690.0, 742811.0, 110849.0, 14417.0, 3628.0, 1330.0, 536.0, 266.0, 154.0, 74.0, 51.0, 35.0, 24.0, 16.0, 13.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.03125, -16.432373046875, -15.83349609375, -15.234619140625, -14.6357421875, -14.036865234375, -13.43798828125, -12.839111328125, -12.240234375, -11.641357421875, -11.04248046875, -10.443603515625, -9.8447265625, -9.245849609375, -8.64697265625, -8.048095703125, -7.44921875, -6.850341796875, -6.25146484375, -5.652587890625, -5.0537109375, -4.454833984375, -3.85595703125, -3.257080078125, -2.658203125, -2.059326171875, -1.46044921875, -0.861572265625, -0.2626953125, 0.336181640625, 0.93505859375, 1.533935546875, 2.1328125, 2.731689453125, 3.33056640625, 3.929443359375, 4.5283203125, 5.127197265625, 5.72607421875, 6.324951171875, 6.923828125, 7.522705078125, 8.12158203125, 8.720458984375, 9.3193359375, 9.918212890625, 10.51708984375, 11.115966796875, 11.71484375, 12.313720703125, 12.91259765625, 13.511474609375, 14.1103515625, 14.709228515625, 15.30810546875, 15.906982421875, 16.505859375, 17.104736328125, 17.70361328125, 18.302490234375, 18.9013671875, 19.500244140625, 20.09912109375, 20.697998046875, 21.296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 18.0, 29.0, 21.0, 39.0, 49.0, 58.0, 83.0, 104.0, 88.0, 106.0, 77.0, 64.0, 63.0, 56.0, 34.0, 22.0, 19.0, 21.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.53125, -21.936279296875, -21.34130859375, -20.746337890625, -20.1513671875, -19.556396484375, -18.96142578125, -18.366455078125, -17.771484375, -17.176513671875, -16.58154296875, -15.986572265625, -15.3916015625, -14.796630859375, -14.20166015625, -13.606689453125, -13.01171875, -12.416748046875, -11.82177734375, -11.226806640625, -10.6318359375, -10.036865234375, -9.44189453125, -8.846923828125, -8.251953125, -7.656982421875, -7.06201171875, -6.467041015625, -5.8720703125, -5.277099609375, -4.68212890625, -4.087158203125, -3.4921875, -2.897216796875, -2.30224609375, -1.707275390625, -1.1123046875, -0.517333984375, 0.07763671875, 0.672607421875, 1.267578125, 1.862548828125, 2.45751953125, 3.052490234375, 3.6474609375, 4.242431640625, 4.83740234375, 5.432373046875, 6.02734375, 6.622314453125, 7.21728515625, 7.812255859375, 8.4072265625, 9.002197265625, 9.59716796875, 10.192138671875, 10.787109375, 11.382080078125, 11.97705078125, 12.572021484375, 13.1669921875, 13.761962890625, 14.35693359375, 14.951904296875, 15.546875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 9.0, 16.0, 34.0, 55.0, 94.0, 161.0, 209.0, 186.0, 118.0, 56.0, 25.0, 16.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-586.5119018554688, -574.9451293945312, -563.37841796875, -551.8116455078125, -540.244873046875, -528.6781616210938, -517.1113891601562, -505.54461669921875, -493.9778747558594, -482.4111328125, -470.8443603515625, -459.2776184082031, -447.71087646484375, -436.14410400390625, -424.5773620605469, -413.0106201171875, -401.44384765625, -389.8771057128906, -378.3103332519531, -366.74359130859375, -355.17681884765625, -343.6100769042969, -332.0433349609375, -320.4765625, -308.9098205566406, -297.34307861328125, -285.77630615234375, -274.2095642089844, -262.642822265625, -251.0760498046875, -239.50930786132812, -227.9425506591797, -216.3758087158203, -204.80905151367188, -193.2423095703125, -181.67555236816406, -170.10879516601562, -158.5420379638672, -146.97528076171875, -135.40853881835938, -123.84178161621094, -112.2750244140625, -100.7082748413086, -89.14152526855469, -77.57476806640625, -66.00801086425781, -54.441261291503906, -42.87451171875, -31.307754516601562, -19.74100112915039, -8.174247741699219, 3.392505645751953, 14.959259033203125, 26.526012420654297, 38.09276580810547, 49.659515380859375, 61.22627258300781, 72.79302978515625, 84.35977935791016, 95.92652893066406, 107.4932861328125, 119.06004333496094, 130.62680053710938, 142.19354248046875, 153.7602996826172]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 8.0, 14.0, 15.0, 19.0, 27.0, 39.0, 39.0, 45.0, 49.0, 49.0, 58.0, 63.0, 89.0, 93.0, 73.0, 43.0, 49.0, 41.0, 35.0, 29.0, 25.0, 22.0, 22.0, 11.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-228.87939453125, -219.91693115234375, -210.9544677734375, -201.99200439453125, -193.029541015625, -184.06707763671875, -175.1046142578125, -166.14215087890625, -157.1796875, -148.21722412109375, -139.2547607421875, -130.29229736328125, -121.329833984375, -112.36737060546875, -103.4049072265625, -94.44244384765625, -85.47998046875, -76.51751708984375, -67.5550537109375, -58.59259033203125, -49.630126953125, -40.66766357421875, -31.7052001953125, -22.74273681640625, -13.7802734375, -4.81781005859375, 4.1446533203125, 13.10711669921875, 22.069580078125, 31.03204345703125, 39.9945068359375, 48.95697021484375, 57.91943359375, 66.88189697265625, 75.8443603515625, 84.80682373046875, 93.769287109375, 102.73175048828125, 111.6942138671875, 120.65667724609375, 129.619140625, 138.58160400390625, 147.5440673828125, 156.50653076171875, 165.468994140625, 174.43145751953125, 183.3939208984375, 192.35638427734375, 201.31884765625, 210.28131103515625, 219.2437744140625, 228.20623779296875, 237.168701171875, 246.13116455078125, 255.0936279296875, 264.05609130859375, 273.0185546875, 281.98101806640625, 290.9434814453125, 299.90594482421875, 308.868408203125, 317.83087158203125, 326.7933349609375, 335.75579833984375, 344.71826171875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 16.0, 14.0, 24.0, 43.0, 108.0, 268.0, 801.0, 3121.0, 23023.0, 786140.0, 3317894.0, 55518.0, 5470.0, 1113.0, 336.0, 156.0, 80.0, 46.0, 39.0, 22.0, 15.0, 10.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.84375, -45.3876953125, -43.931640625, -42.4755859375, -41.01953125, -39.5634765625, -38.107421875, -36.6513671875, -35.1953125, -33.7392578125, -32.283203125, -30.8271484375, -29.37109375, -27.9150390625, -26.458984375, -25.0029296875, -23.546875, -22.0908203125, -20.634765625, -19.1787109375, -17.72265625, -16.2666015625, -14.810546875, -13.3544921875, -11.8984375, -10.4423828125, -8.986328125, -7.5302734375, -6.07421875, -4.6181640625, -3.162109375, -1.7060546875, -0.25, 1.2060546875, 2.662109375, 4.1181640625, 5.57421875, 7.0302734375, 8.486328125, 9.9423828125, 11.3984375, 12.8544921875, 14.310546875, 15.7666015625, 17.22265625, 18.6787109375, 20.134765625, 21.5908203125, 23.046875, 24.5029296875, 25.958984375, 27.4150390625, 28.87109375, 30.3271484375, 31.783203125, 33.2392578125, 34.6953125, 36.1513671875, 37.607421875, 39.0634765625, 40.51953125, 41.9755859375, 43.431640625, 44.8876953125, 46.34375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 14.0, 15.0, 30.0, 59.0, 98.0, 163.0, 173.0, 150.0, 111.0, 63.0, 58.0, 39.0, 20.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.03125, -29.9921875, -28.953125, -27.9140625, -26.875, -25.8359375, -24.796875, -23.7578125, -22.71875, -21.6796875, -20.640625, -19.6015625, -18.5625, -17.5234375, -16.484375, -15.4453125, -14.40625, -13.3671875, -12.328125, -11.2890625, -10.25, -9.2109375, -8.171875, -7.1328125, -6.09375, -5.0546875, -4.015625, -2.9765625, -1.9375, -0.8984375, 0.140625, 1.1796875, 2.21875, 3.2578125, 4.296875, 5.3359375, 6.375, 7.4140625, 8.453125, 9.4921875, 10.53125, 11.5703125, 12.609375, 13.6484375, 14.6875, 15.7265625, 16.765625, 17.8046875, 18.84375, 19.8828125, 20.921875, 21.9609375, 23.0, 24.0390625, 25.078125, 26.1171875, 27.15625, 28.1953125, 29.234375, 30.2734375, 31.3125, 32.3515625, 33.390625, 34.4296875, 35.46875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 13.0, 6.0, 3.0, 15.0, 19.0, 22.0, 39.0, 82.0, 128.0, 233.0, 439.0, 959.0, 2931.0, 12016.0, 76497.0, 1546820.0, 2438042.0, 96294.0, 14260.0, 3342.0, 1095.0, 502.0, 214.0, 113.0, 71.0, 42.0, 32.0, 18.0, 12.0, 7.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.640625, -28.545166015625, -27.44970703125, -26.354248046875, -25.2587890625, -24.163330078125, -23.06787109375, -21.972412109375, -20.876953125, -19.781494140625, -18.68603515625, -17.590576171875, -16.4951171875, -15.399658203125, -14.30419921875, -13.208740234375, -12.11328125, -11.017822265625, -9.92236328125, -8.826904296875, -7.7314453125, -6.635986328125, -5.54052734375, -4.445068359375, -3.349609375, -2.254150390625, -1.15869140625, -0.063232421875, 1.0322265625, 2.127685546875, 3.22314453125, 4.318603515625, 5.4140625, 6.509521484375, 7.60498046875, 8.700439453125, 9.7958984375, 10.891357421875, 11.98681640625, 13.082275390625, 14.177734375, 15.273193359375, 16.36865234375, 17.464111328125, 18.5595703125, 19.655029296875, 20.75048828125, 21.845947265625, 22.94140625, 24.036865234375, 25.13232421875, 26.227783203125, 27.3232421875, 28.418701171875, 29.51416015625, 30.609619140625, 31.705078125, 32.800537109375, 33.89599609375, 34.991455078125, 36.0869140625, 37.182373046875, 38.27783203125, 39.373291015625, 40.46875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 15.0, 25.0, 29.0, 42.0, 45.0, 77.0, 106.0, 186.0, 373.0, 624.0, 968.0, 703.0, 342.0, 196.0, 126.0, 72.0, 38.0, 29.0, 19.0, 12.0, 13.0, 9.0, 8.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.15625, -39.99658203125, -38.8369140625, -37.67724609375, -36.517578125, -35.35791015625, -34.1982421875, -33.03857421875, -31.87890625, -30.71923828125, -29.5595703125, -28.39990234375, -27.240234375, -26.08056640625, -24.9208984375, -23.76123046875, -22.6015625, -21.44189453125, -20.2822265625, -19.12255859375, -17.962890625, -16.80322265625, -15.6435546875, -14.48388671875, -13.32421875, -12.16455078125, -11.0048828125, -9.84521484375, -8.685546875, -7.52587890625, -6.3662109375, -5.20654296875, -4.046875, -2.88720703125, -1.7275390625, -0.56787109375, 0.591796875, 1.75146484375, 2.9111328125, 4.07080078125, 5.23046875, 6.39013671875, 7.5498046875, 8.70947265625, 9.869140625, 11.02880859375, 12.1884765625, 13.34814453125, 14.5078125, 15.66748046875, 16.8271484375, 17.98681640625, 19.146484375, 20.30615234375, 21.4658203125, 22.62548828125, 23.78515625, 24.94482421875, 26.1044921875, 27.26416015625, 28.423828125, 29.58349609375, 30.7431640625, 31.90283203125, 33.0625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0, 15.0, 46.0, 138.0, 325.0, 307.0, 120.0, 29.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-734.3785400390625, -716.8797607421875, -699.3809814453125, -681.8822021484375, -664.3834228515625, -646.8846435546875, -629.3858642578125, -611.8871459960938, -594.3883666992188, -576.8895874023438, -559.3908081054688, -541.8920288085938, -524.3932495117188, -506.8945007324219, -489.3957214355469, -471.8969421386719, -454.3981628417969, -436.8993835449219, -419.4006042480469, -401.90185546875, -384.403076171875, -366.904296875, -349.405517578125, -331.90673828125, -314.407958984375, -296.9091796875, -279.410400390625, -261.91162109375, -244.41287231445312, -226.91409301757812, -209.41531372070312, -191.91653442382812, -174.41775512695312, -156.91897583007812, -139.4202117919922, -121.92143249511719, -104.42266082763672, -86.92388916015625, -69.42510986328125, -51.92633819580078, -34.42756652832031, -16.92879295349121, 0.5699806213378906, 18.068756103515625, 35.567527770996094, 53.06629943847656, 70.56507873535156, 88.06385040283203, 105.5626220703125, 123.06139373779297, 140.56016540527344, 158.05894470214844, 175.55770874023438, 193.05648803710938, 210.55526733398438, 228.05404663085938, 245.5528106689453, 263.05157470703125, 280.55035400390625, 298.04913330078125, 315.54791259765625, 333.04669189453125, 350.54547119140625, 368.0442199707031, 385.5429992675781]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 11.0, 14.0, 14.0, 23.0, 35.0, 35.0, 39.0, 61.0, 50.0, 54.0, 72.0, 70.0, 50.0, 73.0, 65.0, 63.0, 57.0, 45.0, 38.0, 32.0, 18.0, 19.0, 12.0, 11.0, 11.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-232.4778594970703, -226.46580505371094, -220.4537353515625, -214.44168090820312, -208.42962646484375, -202.4175567626953, -196.40550231933594, -190.3934326171875, -184.38137817382812, -178.36932373046875, -172.3572540283203, -166.34519958496094, -160.3331298828125, -154.32107543945312, -148.30902099609375, -142.29696655273438, -136.28489685058594, -130.27284240722656, -124.26077270507812, -118.24871826171875, -112.23665618896484, -106.22459411621094, -100.21253967285156, -94.20047760009766, -88.18841552734375, -82.17635345458984, -76.16429138183594, -70.15223693847656, -64.14017486572266, -58.12811279296875, -52.11605453491211, -46.10399627685547, -40.09193420410156, -34.079872131347656, -28.067813873291016, -22.055753707885742, -16.04369354248047, -10.031633377075195, -4.019573211669922, 1.9924850463867188, 8.004547119140625, 14.016607284545898, 20.028667449951172, 26.040727615356445, 32.05278778076172, 38.064849853515625, 44.076908111572266, 50.088966369628906, 56.10102844238281, 62.11309051513672, 68.12515258789062, 74.13720703125, 80.1492691040039, 86.16133117675781, 92.17338562011719, 98.1854476928711, 104.197509765625, 110.2095718383789, 116.22163391113281, 122.23368835449219, 128.24575805664062, 134.2578125, 140.26986694335938, 146.28192138671875, 152.2939910888672]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 11.0, 12.0, 28.0, 16.0, 33.0, 59.0, 67.0, 98.0, 179.0, 349.0, 890.0, 2524.0, 9767.0, 51262.0, 280051.0, 535395.0, 135635.0, 24213.0, 5158.0, 1496.0, 549.0, 296.0, 134.0, 97.0, 57.0, 46.0, 43.0, 16.0, 19.0, 10.0, 16.0, 8.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-44.6875, -43.4208984375, -42.154296875, -40.8876953125, -39.62109375, -38.3544921875, -37.087890625, -35.8212890625, -34.5546875, -33.2880859375, -32.021484375, -30.7548828125, -29.48828125, -28.2216796875, -26.955078125, -25.6884765625, -24.421875, -23.1552734375, -21.888671875, -20.6220703125, -19.35546875, -18.0888671875, -16.822265625, -15.5556640625, -14.2890625, -13.0224609375, -11.755859375, -10.4892578125, -9.22265625, -7.9560546875, -6.689453125, -5.4228515625, -4.15625, -2.8896484375, -1.623046875, -0.3564453125, 0.91015625, 2.1767578125, 3.443359375, 4.7099609375, 5.9765625, 7.2431640625, 8.509765625, 9.7763671875, 11.04296875, 12.3095703125, 13.576171875, 14.8427734375, 16.109375, 17.3759765625, 18.642578125, 19.9091796875, 21.17578125, 22.4423828125, 23.708984375, 24.9755859375, 26.2421875, 27.5087890625, 28.775390625, 30.0419921875, 31.30859375, 32.5751953125, 33.841796875, 35.1083984375, 36.375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 7.0, 7.0, 15.0, 38.0, 48.0, 105.0, 121.0, 139.0, 159.0, 122.0, 95.0, 58.0, 53.0, 24.0, 10.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.046875, -30.050537109375, -29.05419921875, -28.057861328125, -27.0615234375, -26.065185546875, -25.06884765625, -24.072509765625, -23.076171875, -22.079833984375, -21.08349609375, -20.087158203125, -19.0908203125, -18.094482421875, -17.09814453125, -16.101806640625, -15.10546875, -14.109130859375, -13.11279296875, -12.116455078125, -11.1201171875, -10.123779296875, -9.12744140625, -8.131103515625, -7.134765625, -6.138427734375, -5.14208984375, -4.145751953125, -3.1494140625, -2.153076171875, -1.15673828125, -0.160400390625, 0.8359375, 1.832275390625, 2.82861328125, 3.824951171875, 4.8212890625, 5.817626953125, 6.81396484375, 7.810302734375, 8.806640625, 9.802978515625, 10.79931640625, 11.795654296875, 12.7919921875, 13.788330078125, 14.78466796875, 15.781005859375, 16.77734375, 17.773681640625, 18.77001953125, 19.766357421875, 20.7626953125, 21.759033203125, 22.75537109375, 23.751708984375, 24.748046875, 25.744384765625, 26.74072265625, 27.737060546875, 28.7333984375, 29.729736328125, 30.72607421875, 31.722412109375, 32.71875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 7.0, 6.0, 6.0, 10.0, 14.0, 11.0, 24.0, 37.0, 45.0, 83.0, 139.0, 240.0, 450.0, 931.0, 2062.0, 6593.0, 48364.0, 828719.0, 143704.0, 11644.0, 2963.0, 1181.0, 571.0, 275.0, 169.0, 95.0, 61.0, 33.0, 24.0, 25.0, 22.0, 10.0, 7.0, 12.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-80.3125, -77.927734375, -75.54296875, -73.158203125, -70.7734375, -68.388671875, -66.00390625, -63.619140625, -61.234375, -58.849609375, -56.46484375, -54.080078125, -51.6953125, -49.310546875, -46.92578125, -44.541015625, -42.15625, -39.771484375, -37.38671875, -35.001953125, -32.6171875, -30.232421875, -27.84765625, -25.462890625, -23.078125, -20.693359375, -18.30859375, -15.923828125, -13.5390625, -11.154296875, -8.76953125, -6.384765625, -4.0, -1.615234375, 0.76953125, 3.154296875, 5.5390625, 7.923828125, 10.30859375, 12.693359375, 15.078125, 17.462890625, 19.84765625, 22.232421875, 24.6171875, 27.001953125, 29.38671875, 31.771484375, 34.15625, 36.541015625, 38.92578125, 41.310546875, 43.6953125, 46.080078125, 48.46484375, 50.849609375, 53.234375, 55.619140625, 58.00390625, 60.388671875, 62.7734375, 65.158203125, 67.54296875, 69.927734375, 72.3125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 8.0, 11.0, 23.0, 21.0, 27.0, 35.0, 55.0, 100.0, 93.0, 116.0, 113.0, 89.0, 73.0, 63.0, 53.0, 39.0, 27.0, 12.0, 8.0, 7.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-120.9375, -117.4794921875, -114.021484375, -110.5634765625, -107.10546875, -103.6474609375, -100.189453125, -96.7314453125, -93.2734375, -89.8154296875, -86.357421875, -82.8994140625, -79.44140625, -75.9833984375, -72.525390625, -69.0673828125, -65.609375, -62.1513671875, -58.693359375, -55.2353515625, -51.77734375, -48.3193359375, -44.861328125, -41.4033203125, -37.9453125, -34.4873046875, -31.029296875, -27.5712890625, -24.11328125, -20.6552734375, -17.197265625, -13.7392578125, -10.28125, -6.8232421875, -3.365234375, 0.0927734375, 3.55078125, 7.0087890625, 10.466796875, 13.9248046875, 17.3828125, 20.8408203125, 24.298828125, 27.7568359375, 31.21484375, 34.6728515625, 38.130859375, 41.5888671875, 45.046875, 48.5048828125, 51.962890625, 55.4208984375, 58.87890625, 62.3369140625, 65.794921875, 69.2529296875, 72.7109375, 76.1689453125, 79.626953125, 83.0849609375, 86.54296875, 90.0009765625, 93.458984375, 96.9169921875, 100.375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 10.0, 12.0, 12.0, 17.0, 29.0, 39.0, 65.0, 133.0, 261.0, 651.0, 2041.0, 12669.0, 823779.0, 199737.0, 6703.0, 1445.0, 473.0, 208.0, 111.0, 51.0, 37.0, 17.0, 15.0, 13.0, 10.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.515625, -28.416748046875, -27.31787109375, -26.218994140625, -25.1201171875, -24.021240234375, -22.92236328125, -21.823486328125, -20.724609375, -19.625732421875, -18.52685546875, -17.427978515625, -16.3291015625, -15.230224609375, -14.13134765625, -13.032470703125, -11.93359375, -10.834716796875, -9.73583984375, -8.636962890625, -7.5380859375, -6.439208984375, -5.34033203125, -4.241455078125, -3.142578125, -2.043701171875, -0.94482421875, 0.154052734375, 1.2529296875, 2.351806640625, 3.45068359375, 4.549560546875, 5.6484375, 6.747314453125, 7.84619140625, 8.945068359375, 10.0439453125, 11.142822265625, 12.24169921875, 13.340576171875, 14.439453125, 15.538330078125, 16.63720703125, 17.736083984375, 18.8349609375, 19.933837890625, 21.03271484375, 22.131591796875, 23.23046875, 24.329345703125, 25.42822265625, 26.527099609375, 27.6259765625, 28.724853515625, 29.82373046875, 30.922607421875, 32.021484375, 33.120361328125, 34.21923828125, 35.318115234375, 36.4169921875, 37.515869140625, 38.61474609375, 39.713623046875, 40.8125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 6.0, 8.0, 7.0, 18.0, 20.0, 29.0, 36.0, 42.0, 73.0, 106.0, 144.0, 143.0, 132.0, 74.0, 43.0, 40.0, 32.0, 13.0, 13.0, 11.0, 9.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005565643310546875, -0.005422830581665039, -0.005280017852783203, -0.005137205123901367, -0.004994392395019531, -0.004851579666137695, -0.004708766937255859, -0.0045659542083740234, -0.0044231414794921875, -0.0042803287506103516, -0.004137516021728516, -0.00399470329284668, -0.0038518905639648438, -0.003709077835083008, -0.003566265106201172, -0.003423452377319336, -0.0032806396484375, -0.003137826919555664, -0.002995014190673828, -0.002852201461791992, -0.0027093887329101562, -0.0025665760040283203, -0.0024237632751464844, -0.0022809505462646484, -0.0021381378173828125, -0.0019953250885009766, -0.0018525123596191406, -0.0017096996307373047, -0.0015668869018554688, -0.0014240741729736328, -0.0012812614440917969, -0.001138448715209961, -0.000995635986328125, -0.0008528232574462891, -0.0007100105285644531, -0.0005671977996826172, -0.00042438507080078125, -0.0002815723419189453, -0.00013875961303710938, 4.0531158447265625e-06, 0.0001468658447265625, 0.00028967857360839844, 0.0004324913024902344, 0.0005753040313720703, 0.0007181167602539062, 0.0008609294891357422, 0.0010037422180175781, 0.001146554946899414, 0.00128936767578125, 0.001432180404663086, 0.0015749931335449219, 0.0017178058624267578, 0.0018606185913085938, 0.0020034313201904297, 0.0021462440490722656, 0.0022890567779541016, 0.0024318695068359375, 0.0025746822357177734, 0.0027174949645996094, 0.0028603076934814453, 0.0030031204223632812, 0.003145933151245117, 0.003288745880126953, 0.003431558609008789, 0.003574371337890625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 10.0, 8.0, 19.0, 32.0, 50.0, 87.0, 159.0, 353.0, 924.0, 2901.0, 14000.0, 753666.0, 263147.0, 9576.0, 2214.0, 734.0, 276.0, 152.0, 77.0, 61.0, 26.0, 16.0, 11.0, 4.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.484375, -26.423583984375, -25.36279296875, -24.302001953125, -23.2412109375, -22.180419921875, -21.11962890625, -20.058837890625, -18.998046875, -17.937255859375, -16.87646484375, -15.815673828125, -14.7548828125, -13.694091796875, -12.63330078125, -11.572509765625, -10.51171875, -9.450927734375, -8.39013671875, -7.329345703125, -6.2685546875, -5.207763671875, -4.14697265625, -3.086181640625, -2.025390625, -0.964599609375, 0.09619140625, 1.156982421875, 2.2177734375, 3.278564453125, 4.33935546875, 5.400146484375, 6.4609375, 7.521728515625, 8.58251953125, 9.643310546875, 10.7041015625, 11.764892578125, 12.82568359375, 13.886474609375, 14.947265625, 16.008056640625, 17.06884765625, 18.129638671875, 19.1904296875, 20.251220703125, 21.31201171875, 22.372802734375, 23.43359375, 24.494384765625, 25.55517578125, 26.615966796875, 27.6767578125, 28.737548828125, 29.79833984375, 30.859130859375, 31.919921875, 32.980712890625, 34.04150390625, 35.102294921875, 36.1630859375, 37.223876953125, 38.28466796875, 39.345458984375, 40.40625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 23.0, 48.0, 108.0, 190.0, 223.0, 170.0, 102.0, 34.0, 34.0, 15.0, 6.0, 9.0, 7.0, 3.0, 4.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.96875, -24.85888671875, -23.7490234375, -22.63916015625, -21.529296875, -20.41943359375, -19.3095703125, -18.19970703125, -17.08984375, -15.97998046875, -14.8701171875, -13.76025390625, -12.650390625, -11.54052734375, -10.4306640625, -9.32080078125, -8.2109375, -7.10107421875, -5.9912109375, -4.88134765625, -3.771484375, -2.66162109375, -1.5517578125, -0.44189453125, 0.66796875, 1.77783203125, 2.8876953125, 3.99755859375, 5.107421875, 6.21728515625, 7.3271484375, 8.43701171875, 9.546875, 10.65673828125, 11.7666015625, 12.87646484375, 13.986328125, 15.09619140625, 16.2060546875, 17.31591796875, 18.42578125, 19.53564453125, 20.6455078125, 21.75537109375, 22.865234375, 23.97509765625, 25.0849609375, 26.19482421875, 27.3046875, 28.41455078125, 29.5244140625, 30.63427734375, 31.744140625, 32.85400390625, 33.9638671875, 35.07373046875, 36.18359375, 37.29345703125, 38.4033203125, 39.51318359375, 40.623046875, 41.73291015625, 42.8427734375, 43.95263671875, 45.0625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 10.0, 53.0, 117.0, 281.0, 292.0, 123.0, 66.0, 25.0, 12.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-283.630126953125, -267.9104309082031, -252.1907501220703, -236.4710693359375, -220.75137329101562, -205.0316925048828, -189.31201171875, -173.59231567382812, -157.8726348876953, -142.1529541015625, -126.43325805664062, -110.71357727050781, -94.99388885498047, -79.27420043945312, -63.55451965332031, -47.83483123779297, -32.115142822265625, -16.395456314086914, -0.6757698059082031, 15.043914794921875, 30.76360321044922, 46.48329162597656, 62.202972412109375, 77.92266082763672, 93.64234924316406, 109.3620376586914, 125.08172607421875, 140.80140686035156, 156.52108764648438, 172.24078369140625, 187.96046447753906, 203.68014526367188, 219.39984130859375, 235.11952209472656, 250.83921813964844, 266.55889892578125, 282.2785949707031, 297.998291015625, 313.71795654296875, 329.4376525878906, 345.1573486328125, 360.8770446777344, 376.5967102050781, 392.31640625, 408.0361022949219, 423.75579833984375, 439.4754638671875, 455.1951599121094, 470.9148254394531, 486.634521484375, 502.35418701171875, 518.0738525390625, 533.7935791015625, 549.5132446289062, 565.23291015625, 580.95263671875, 596.6723022460938, 612.3919677734375, 628.1116943359375, 643.8313598632812, 659.551025390625, 675.270751953125, 690.9904174804688, 706.7100830078125, 722.4298095703125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 7.0, 10.0, 12.0, 18.0, 25.0, 22.0, 38.0, 31.0, 45.0, 50.0, 44.0, 89.0, 103.0, 92.0, 87.0, 61.0, 45.0, 54.0, 39.0, 25.0, 23.0, 24.0, 12.0, 16.0, 8.0, 6.0, 8.0, 4.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-273.3094482421875, -263.60888671875, -253.90829467773438, -244.2077178955078, -234.50714111328125, -224.8065643310547, -215.10598754882812, -205.40541076660156, -195.704833984375, -186.00425720214844, -176.30368041992188, -166.6031036376953, -156.90252685546875, -147.2019500732422, -137.50137329101562, -127.80079650878906, -118.1002197265625, -108.39964294433594, -98.69906616210938, -88.99848937988281, -79.29791259765625, -69.59733581542969, -59.896759033203125, -50.19618225097656, -40.49560546875, -30.795028686523438, -21.094451904296875, -11.393875122070312, -1.69329833984375, 8.007278442382812, 17.707855224609375, 27.408432006835938, 37.108978271484375, 46.80955505371094, 56.5101318359375, 66.21070861816406, 75.91128540039062, 85.61186218261719, 95.31243896484375, 105.01301574707031, 114.71359252929688, 124.41416931152344, 134.11474609375, 143.81532287597656, 153.51589965820312, 163.2164764404297, 172.91705322265625, 182.6176300048828, 192.31820678710938, 202.01878356933594, 211.7193603515625, 221.41993713378906, 231.12051391601562, 240.8210906982422, 250.52166748046875, 260.22222900390625, 269.9228210449219, 279.6234130859375, 289.323974609375, 299.0245361328125, 308.7251281738281, 318.42572021484375, 328.12628173828125, 337.82684326171875, 347.5274353027344]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 9.0, 11.0, 46.0, 70.0, 169.0, 389.0, 1441.0, 9417.0, 230357.0, 3839806.0, 105356.0, 5558.0, 1010.0, 330.0, 154.0, 65.0, 36.0, 20.0, 9.0, 8.0, 11.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.9375, -50.683349609375, -49.42919921875, -48.175048828125, -46.9208984375, -45.666748046875, -44.41259765625, -43.158447265625, -41.904296875, -40.650146484375, -39.39599609375, -38.141845703125, -36.8876953125, -35.633544921875, -34.37939453125, -33.125244140625, -31.87109375, -30.616943359375, -29.36279296875, -28.108642578125, -26.8544921875, -25.600341796875, -24.34619140625, -23.092041015625, -21.837890625, -20.583740234375, -19.32958984375, -18.075439453125, -16.8212890625, -15.567138671875, -14.31298828125, -13.058837890625, -11.8046875, -10.550537109375, -9.29638671875, -8.042236328125, -6.7880859375, -5.533935546875, -4.27978515625, -3.025634765625, -1.771484375, -0.517333984375, 0.73681640625, 1.990966796875, 3.2451171875, 4.499267578125, 5.75341796875, 7.007568359375, 8.26171875, 9.515869140625, 10.77001953125, 12.024169921875, 13.2783203125, 14.532470703125, 15.78662109375, 17.040771484375, 18.294921875, 19.549072265625, 20.80322265625, 22.057373046875, 23.3115234375, 24.565673828125, 25.81982421875, 27.073974609375, 28.328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 9.0, 15.0, 20.0, 23.0, 29.0, 33.0, 50.0, 51.0, 72.0, 67.0, 77.0, 84.0, 82.0, 61.0, 65.0, 53.0, 50.0, 43.0, 35.0, 29.0, 17.0, 9.0, 9.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.28125, -10.75927734375, -10.2373046875, -9.71533203125, -9.193359375, -8.67138671875, -8.1494140625, -7.62744140625, -7.10546875, -6.58349609375, -6.0615234375, -5.53955078125, -5.017578125, -4.49560546875, -3.9736328125, -3.45166015625, -2.9296875, -2.40771484375, -1.8857421875, -1.36376953125, -0.841796875, -0.31982421875, 0.2021484375, 0.72412109375, 1.24609375, 1.76806640625, 2.2900390625, 2.81201171875, 3.333984375, 3.85595703125, 4.3779296875, 4.89990234375, 5.421875, 5.94384765625, 6.4658203125, 6.98779296875, 7.509765625, 8.03173828125, 8.5537109375, 9.07568359375, 9.59765625, 10.11962890625, 10.6416015625, 11.16357421875, 11.685546875, 12.20751953125, 12.7294921875, 13.25146484375, 13.7734375, 14.29541015625, 14.8173828125, 15.33935546875, 15.861328125, 16.38330078125, 16.9052734375, 17.42724609375, 17.94921875, 18.47119140625, 18.9931640625, 19.51513671875, 20.037109375, 20.55908203125, 21.0810546875, 21.60302734375, 22.125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 17.0, 27.0, 28.0, 43.0, 75.0, 111.0, 212.0, 314.0, 701.0, 1760.0, 5786.0, 24080.0, 163571.0, 3152966.0, 772413.0, 55475.0, 11193.0, 3034.0, 1125.0, 544.0, 305.0, 162.0, 111.0, 68.0, 47.0, 27.0, 15.0, 18.0, 9.0, 9.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.25, -20.425048828125, -19.60009765625, -18.775146484375, -17.9501953125, -17.125244140625, -16.30029296875, -15.475341796875, -14.650390625, -13.825439453125, -13.00048828125, -12.175537109375, -11.3505859375, -10.525634765625, -9.70068359375, -8.875732421875, -8.05078125, -7.225830078125, -6.40087890625, -5.575927734375, -4.7509765625, -3.926025390625, -3.10107421875, -2.276123046875, -1.451171875, -0.626220703125, 0.19873046875, 1.023681640625, 1.8486328125, 2.673583984375, 3.49853515625, 4.323486328125, 5.1484375, 5.973388671875, 6.79833984375, 7.623291015625, 8.4482421875, 9.273193359375, 10.09814453125, 10.923095703125, 11.748046875, 12.572998046875, 13.39794921875, 14.222900390625, 15.0478515625, 15.872802734375, 16.69775390625, 17.522705078125, 18.34765625, 19.172607421875, 19.99755859375, 20.822509765625, 21.6474609375, 22.472412109375, 23.29736328125, 24.122314453125, 24.947265625, 25.772216796875, 26.59716796875, 27.422119140625, 28.2470703125, 29.072021484375, 29.89697265625, 30.721923828125, 31.546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 7.0, 5.0, 18.0, 17.0, 26.0, 44.0, 66.0, 91.0, 201.0, 391.0, 818.0, 979.0, 707.0, 325.0, 184.0, 66.0, 43.0, 27.0, 17.0, 18.0, 8.0, 4.0, 6.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5, -24.35986328125, -23.2197265625, -22.07958984375, -20.939453125, -19.79931640625, -18.6591796875, -17.51904296875, -16.37890625, -15.23876953125, -14.0986328125, -12.95849609375, -11.818359375, -10.67822265625, -9.5380859375, -8.39794921875, -7.2578125, -6.11767578125, -4.9775390625, -3.83740234375, -2.697265625, -1.55712890625, -0.4169921875, 0.72314453125, 1.86328125, 3.00341796875, 4.1435546875, 5.28369140625, 6.423828125, 7.56396484375, 8.7041015625, 9.84423828125, 10.984375, 12.12451171875, 13.2646484375, 14.40478515625, 15.544921875, 16.68505859375, 17.8251953125, 18.96533203125, 20.10546875, 21.24560546875, 22.3857421875, 23.52587890625, 24.666015625, 25.80615234375, 26.9462890625, 28.08642578125, 29.2265625, 30.36669921875, 31.5068359375, 32.64697265625, 33.787109375, 34.92724609375, 36.0673828125, 37.20751953125, 38.34765625, 39.48779296875, 40.6279296875, 41.76806640625, 42.908203125, 44.04833984375, 45.1884765625, 46.32861328125, 47.46875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 14.0, 35.0, 90.0, 210.0, 250.0, 203.0, 110.0, 31.0, 20.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-445.8471374511719, -436.294677734375, -426.7422180175781, -417.18975830078125, -407.6372985839844, -398.0848388671875, -388.5323791503906, -378.97991943359375, -369.427490234375, -359.8750305175781, -350.32257080078125, -340.7701110839844, -331.2176513671875, -321.6651916503906, -312.11273193359375, -302.560302734375, -293.0078125, -283.4553527832031, -273.90289306640625, -264.3504333496094, -254.7979736328125, -245.24551391601562, -235.6930694580078, -226.14060974121094, -216.58815002441406, -207.0356903076172, -197.4832305908203, -187.93077087402344, -178.37832641601562, -168.82586669921875, -159.27340698242188, -149.720947265625, -140.16848754882812, -130.61602783203125, -121.06356811523438, -111.51111602783203, -101.95865631103516, -92.40619659423828, -82.85374450683594, -73.30128479003906, -63.74882507324219, -54.19636535644531, -44.6439094543457, -35.091453552246094, -25.53899383544922, -15.986534118652344, -6.434078216552734, 3.118377685546875, 12.67083740234375, 22.223295211791992, 31.775753021240234, 41.328208923339844, 50.88066864013672, 60.433128356933594, 69.98558044433594, 79.53804016113281, 89.09049987792969, 98.64295959472656, 108.19541931152344, 117.74787139892578, 127.30033111572266, 136.852783203125, 146.40524291992188, 155.95770263671875, 165.51016235351562]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 12.0, 7.0, 7.0, 11.0, 16.0, 18.0, 32.0, 31.0, 25.0, 31.0, 37.0, 36.0, 41.0, 58.0, 66.0, 54.0, 51.0, 52.0, 53.0, 44.0, 50.0, 38.0, 41.0, 32.0, 22.0, 21.0, 23.0, 14.0, 17.0, 7.0, 9.0, 9.0, 4.0, 4.0, 0.0, 2.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-124.53396606445312, -120.87499237060547, -117.21602630615234, -113.55705261230469, -109.89808654785156, -106.2391128540039, -102.58013916015625, -98.92117309570312, -95.26219940185547, -91.60322570800781, -87.94425964355469, -84.28528594970703, -80.6263198852539, -76.96734619140625, -73.30838012695312, -69.64940643310547, -65.99043273925781, -62.33146286010742, -58.67249298095703, -55.013519287109375, -51.354549407958984, -47.695579528808594, -44.0366096496582, -40.37763977050781, -36.71867370605469, -33.0597038269043, -29.400732040405273, -25.741762161254883, -22.08279037475586, -18.42382049560547, -14.764850616455078, -11.105878829956055, -7.446907043457031, -3.7879364490509033, -0.1289658546447754, 3.5300045013427734, 7.1889753341674805, 10.847946166992188, 14.506916046142578, 18.1658878326416, 21.824857711791992, 25.483827590942383, 29.142799377441406, 32.8017692565918, 36.46073913574219, 40.119712829589844, 43.77867889404297, 47.437652587890625, 51.096622467041016, 54.755592346191406, 58.4145622253418, 62.07353210449219, 65.73250579833984, 69.3914794921875, 73.05044555664062, 76.70941925048828, 80.3683853149414, 84.02735900878906, 87.68632507324219, 91.34529876708984, 95.00426483154297, 98.66323852539062, 102.32220458984375, 105.9811782836914, 109.64015197753906]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 7.0, 9.0, 17.0, 20.0, 34.0, 58.0, 66.0, 128.0, 214.0, 417.0, 975.0, 2227.0, 6286.0, 21033.0, 84826.0, 350993.0, 428785.0, 112386.0, 27316.0, 7732.0, 2789.0, 1070.0, 478.0, 288.0, 147.0, 89.0, 53.0, 29.0, 23.0, 18.0, 13.0, 6.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-40.625, -39.61181640625, -38.5986328125, -37.58544921875, -36.572265625, -35.55908203125, -34.5458984375, -33.53271484375, -32.51953125, -31.50634765625, -30.4931640625, -29.47998046875, -28.466796875, -27.45361328125, -26.4404296875, -25.42724609375, -24.4140625, -23.40087890625, -22.3876953125, -21.37451171875, -20.361328125, -19.34814453125, -18.3349609375, -17.32177734375, -16.30859375, -15.29541015625, -14.2822265625, -13.26904296875, -12.255859375, -11.24267578125, -10.2294921875, -9.21630859375, -8.203125, -7.18994140625, -6.1767578125, -5.16357421875, -4.150390625, -3.13720703125, -2.1240234375, -1.11083984375, -0.09765625, 0.91552734375, 1.9287109375, 2.94189453125, 3.955078125, 4.96826171875, 5.9814453125, 6.99462890625, 8.0078125, 9.02099609375, 10.0341796875, 11.04736328125, 12.060546875, 13.07373046875, 14.0869140625, 15.10009765625, 16.11328125, 17.12646484375, 18.1396484375, 19.15283203125, 20.166015625, 21.17919921875, 22.1923828125, 23.20556640625, 24.21875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 7.0, 10.0, 14.0, 22.0, 19.0, 24.0, 39.0, 29.0, 44.0, 31.0, 53.0, 57.0, 44.0, 51.0, 73.0, 51.0, 58.0, 48.0, 42.0, 49.0, 41.0, 34.0, 41.0, 26.0, 31.0, 19.0, 11.0, 7.0, 8.0, 11.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.722412109375, -11.32763671875, -10.932861328125, -10.5380859375, -10.143310546875, -9.74853515625, -9.353759765625, -8.958984375, -8.564208984375, -8.16943359375, -7.774658203125, -7.3798828125, -6.985107421875, -6.59033203125, -6.195556640625, -5.80078125, -5.406005859375, -5.01123046875, -4.616455078125, -4.2216796875, -3.826904296875, -3.43212890625, -3.037353515625, -2.642578125, -2.247802734375, -1.85302734375, -1.458251953125, -1.0634765625, -0.668701171875, -0.27392578125, 0.120849609375, 0.515625, 0.910400390625, 1.30517578125, 1.699951171875, 2.0947265625, 2.489501953125, 2.88427734375, 3.279052734375, 3.673828125, 4.068603515625, 4.46337890625, 4.858154296875, 5.2529296875, 5.647705078125, 6.04248046875, 6.437255859375, 6.83203125, 7.226806640625, 7.62158203125, 8.016357421875, 8.4111328125, 8.805908203125, 9.20068359375, 9.595458984375, 9.990234375, 10.385009765625, 10.77978515625, 11.174560546875, 11.5693359375, 11.964111328125, 12.35888671875, 12.753662109375, 13.1484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 12.0, 16.0, 31.0, 57.0, 107.0, 166.0, 313.0, 594.0, 1400.0, 4010.0, 27932.0, 729711.0, 265289.0, 13894.0, 2774.0, 1112.0, 480.0, 274.0, 147.0, 91.0, 41.0, 34.0, 21.0, 12.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.125, -71.869140625, -69.61328125, -67.357421875, -65.1015625, -62.845703125, -60.58984375, -58.333984375, -56.078125, -53.822265625, -51.56640625, -49.310546875, -47.0546875, -44.798828125, -42.54296875, -40.287109375, -38.03125, -35.775390625, -33.51953125, -31.263671875, -29.0078125, -26.751953125, -24.49609375, -22.240234375, -19.984375, -17.728515625, -15.47265625, -13.216796875, -10.9609375, -8.705078125, -6.44921875, -4.193359375, -1.9375, 0.318359375, 2.57421875, 4.830078125, 7.0859375, 9.341796875, 11.59765625, 13.853515625, 16.109375, 18.365234375, 20.62109375, 22.876953125, 25.1328125, 27.388671875, 29.64453125, 31.900390625, 34.15625, 36.412109375, 38.66796875, 40.923828125, 43.1796875, 45.435546875, 47.69140625, 49.947265625, 52.203125, 54.458984375, 56.71484375, 58.970703125, 61.2265625, 63.482421875, 65.73828125, 67.994140625, 70.25]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 5.0, 8.0, 6.0, 7.0, 10.0, 12.0, 19.0, 17.0, 24.0, 32.0, 29.0, 29.0, 31.0, 49.0, 52.0, 54.0, 56.0, 50.0, 48.0, 48.0, 45.0, 52.0, 54.0, 38.0, 33.0, 37.0, 29.0, 16.0, 23.0, 18.0, 9.0, 6.0, 14.0, 9.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-41.15625, -39.8251953125, -38.494140625, -37.1630859375, -35.83203125, -34.5009765625, -33.169921875, -31.8388671875, -30.5078125, -29.1767578125, -27.845703125, -26.5146484375, -25.18359375, -23.8525390625, -22.521484375, -21.1904296875, -19.859375, -18.5283203125, -17.197265625, -15.8662109375, -14.53515625, -13.2041015625, -11.873046875, -10.5419921875, -9.2109375, -7.8798828125, -6.548828125, -5.2177734375, -3.88671875, -2.5556640625, -1.224609375, 0.1064453125, 1.4375, 2.7685546875, 4.099609375, 5.4306640625, 6.76171875, 8.0927734375, 9.423828125, 10.7548828125, 12.0859375, 13.4169921875, 14.748046875, 16.0791015625, 17.41015625, 18.7412109375, 20.072265625, 21.4033203125, 22.734375, 24.0654296875, 25.396484375, 26.7275390625, 28.05859375, 29.3896484375, 30.720703125, 32.0517578125, 33.3828125, 34.7138671875, 36.044921875, 37.3759765625, 38.70703125, 40.0380859375, 41.369140625, 42.7001953125, 44.03125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 0.0, 5.0, 3.0, 12.0, 8.0, 17.0, 15.0, 17.0, 34.0, 57.0, 81.0, 148.0, 257.0, 568.0, 1710.0, 8699.0, 134774.0, 850641.0, 44548.0, 4866.0, 1106.0, 408.0, 216.0, 110.0, 80.0, 61.0, 33.0, 19.0, 19.0, 10.0, 10.0, 7.0, 4.0, 4.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.75, -18.1318359375, -17.513671875, -16.8955078125, -16.27734375, -15.6591796875, -15.041015625, -14.4228515625, -13.8046875, -13.1865234375, -12.568359375, -11.9501953125, -11.33203125, -10.7138671875, -10.095703125, -9.4775390625, -8.859375, -8.2412109375, -7.623046875, -7.0048828125, -6.38671875, -5.7685546875, -5.150390625, -4.5322265625, -3.9140625, -3.2958984375, -2.677734375, -2.0595703125, -1.44140625, -0.8232421875, -0.205078125, 0.4130859375, 1.03125, 1.6494140625, 2.267578125, 2.8857421875, 3.50390625, 4.1220703125, 4.740234375, 5.3583984375, 5.9765625, 6.5947265625, 7.212890625, 7.8310546875, 8.44921875, 9.0673828125, 9.685546875, 10.3037109375, 10.921875, 11.5400390625, 12.158203125, 12.7763671875, 13.39453125, 14.0126953125, 14.630859375, 15.2490234375, 15.8671875, 16.4853515625, 17.103515625, 17.7216796875, 18.33984375, 18.9580078125, 19.576171875, 20.1943359375, 20.8125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 1.0, 8.0, 10.0, 14.0, 19.0, 25.0, 29.0, 35.0, 41.0, 63.0, 73.0, 81.0, 105.0, 110.0, 97.0, 67.0, 54.0, 38.0, 35.0, 20.0, 19.0, 6.0, 10.0, 6.0, 4.0, 4.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00267791748046875, -0.0025854110717773438, -0.0024929046630859375, -0.0024003982543945312, -0.002307891845703125, -0.0022153854370117188, -0.0021228790283203125, -0.0020303726196289062, -0.0019378662109375, -0.0018453598022460938, -0.0017528533935546875, -0.0016603469848632812, -0.001567840576171875, -0.0014753341674804688, -0.0013828277587890625, -0.0012903213500976562, -0.00119781494140625, -0.0011053085327148438, -0.0010128021240234375, -0.0009202957153320312, -0.000827789306640625, -0.0007352828979492188, -0.0006427764892578125, -0.0005502700805664062, -0.000457763671875, -0.00036525726318359375, -0.0002727508544921875, -0.00018024444580078125, -8.7738037109375e-05, 4.76837158203125e-06, 9.72747802734375e-05, 0.00018978118896484375, 0.00028228759765625, 0.00037479400634765625, 0.0004673004150390625, 0.0005598068237304688, 0.000652313232421875, 0.0007448196411132812, 0.0008373260498046875, 0.0009298324584960938, 0.0010223388671875, 0.0011148452758789062, 0.0012073516845703125, 0.0012998580932617188, 0.001392364501953125, 0.0014848709106445312, 0.0015773773193359375, 0.0016698837280273438, 0.00176239013671875, 0.0018548965454101562, 0.0019474029541015625, 0.0020399093627929688, 0.002132415771484375, 0.0022249221801757812, 0.0023174285888671875, 0.0024099349975585938, 0.00250244140625, 0.0025949478149414062, 0.0026874542236328125, 0.0027799606323242188, 0.002872467041015625, 0.0029649734497070312, 0.0030574798583984375, 0.0031499862670898438, 0.00324249267578125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 10.0, 7.0, 11.0, 9.0, 14.0, 31.0, 41.0, 60.0, 107.0, 162.0, 323.0, 567.0, 1307.0, 3769.0, 16008.0, 202217.0, 766212.0, 46512.0, 7165.0, 2198.0, 856.0, 394.0, 224.0, 119.0, 79.0, 38.0, 32.0, 22.0, 21.0, 17.0, 4.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.155029296875, -12.65380859375, -12.152587890625, -11.6513671875, -11.150146484375, -10.64892578125, -10.147705078125, -9.646484375, -9.145263671875, -8.64404296875, -8.142822265625, -7.6416015625, -7.140380859375, -6.63916015625, -6.137939453125, -5.63671875, -5.135498046875, -4.63427734375, -4.133056640625, -3.6318359375, -3.130615234375, -2.62939453125, -2.128173828125, -1.626953125, -1.125732421875, -0.62451171875, -0.123291015625, 0.3779296875, 0.879150390625, 1.38037109375, 1.881591796875, 2.3828125, 2.884033203125, 3.38525390625, 3.886474609375, 4.3876953125, 4.888916015625, 5.39013671875, 5.891357421875, 6.392578125, 6.893798828125, 7.39501953125, 7.896240234375, 8.3974609375, 8.898681640625, 9.39990234375, 9.901123046875, 10.40234375, 10.903564453125, 11.40478515625, 11.906005859375, 12.4072265625, 12.908447265625, 13.40966796875, 13.910888671875, 14.412109375, 14.913330078125, 15.41455078125, 15.915771484375, 16.4169921875, 16.918212890625, 17.41943359375, 17.920654296875, 18.421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 5.0, 7.0, 4.0, 7.0, 9.0, 16.0, 23.0, 50.0, 103.0, 114.0, 156.0, 143.0, 140.0, 82.0, 52.0, 36.0, 18.0, 15.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.875, -23.229736328125, -22.58447265625, -21.939208984375, -21.2939453125, -20.648681640625, -20.00341796875, -19.358154296875, -18.712890625, -18.067626953125, -17.42236328125, -16.777099609375, -16.1318359375, -15.486572265625, -14.84130859375, -14.196044921875, -13.55078125, -12.905517578125, -12.26025390625, -11.614990234375, -10.9697265625, -10.324462890625, -9.67919921875, -9.033935546875, -8.388671875, -7.743408203125, -7.09814453125, -6.452880859375, -5.8076171875, -5.162353515625, -4.51708984375, -3.871826171875, -3.2265625, -2.581298828125, -1.93603515625, -1.290771484375, -0.6455078125, -0.000244140625, 0.64501953125, 1.290283203125, 1.935546875, 2.580810546875, 3.22607421875, 3.871337890625, 4.5166015625, 5.161865234375, 5.80712890625, 6.452392578125, 7.09765625, 7.742919921875, 8.38818359375, 9.033447265625, 9.6787109375, 10.323974609375, 10.96923828125, 11.614501953125, 12.259765625, 12.905029296875, 13.55029296875, 14.195556640625, 14.8408203125, 15.486083984375, 16.13134765625, 16.776611328125, 17.421875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 12.0, 56.0, 253.0, 486.0, 153.0, 24.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-604.149169921875, -582.058837890625, -559.968505859375, -537.878173828125, -515.787841796875, -493.697509765625, -471.607177734375, -449.516845703125, -427.426513671875, -405.336181640625, -383.245849609375, -361.155517578125, -339.065185546875, -316.974853515625, -294.884521484375, -272.794189453125, -250.703857421875, -228.613525390625, -206.523193359375, -184.432861328125, -162.342529296875, -140.252197265625, -118.161865234375, -96.071533203125, -73.981201171875, -51.890869140625, -29.800537109375, -7.710205078125, 14.380126953125, 36.470458984375, 58.560791015625, 80.651123046875, 102.74139404296875, 124.83172607421875, 146.92205810546875, 169.01239013671875, 191.10272216796875, 213.19305419921875, 235.28338623046875, 257.37371826171875, 279.46405029296875, 301.55438232421875, 323.64471435546875, 345.73504638671875, 367.82537841796875, 389.91571044921875, 412.00604248046875, 434.09637451171875, 456.18670654296875, 478.27703857421875, 500.36737060546875, 522.4577026367188, 544.5480346679688, 566.6383666992188, 588.7286987304688, 610.8190307617188, 632.9093627929688, 654.9996948242188, 677.0900268554688, 699.1803588867188, 721.2706909179688, 743.3610229492188, 765.4513549804688, 787.5416870117188, 809.6320190429688]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 11.0, 10.0, 7.0, 14.0, 30.0, 13.0, 18.0, 17.0, 23.0, 27.0, 27.0, 28.0, 33.0, 34.0, 47.0, 51.0, 50.0, 76.0, 65.0, 55.0, 29.0, 40.0, 30.0, 33.0, 34.0, 27.0, 25.0, 18.0, 20.0, 15.0, 12.0, 14.0, 5.0, 8.0, 9.0, 6.0, 6.0, 4.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-145.0458984375, -140.1067657470703, -135.16763305664062, -130.228515625, -125.28938293457031, -120.35025024414062, -115.41111755371094, -110.47198486328125, -105.5328598022461, -100.5937271118164, -95.65460205078125, -90.71546936035156, -85.77633666992188, -80.83721160888672, -75.89807891845703, -70.95895385742188, -66.01982116699219, -61.080692291259766, -56.141563415527344, -51.202430725097656, -46.263301849365234, -41.32417297363281, -36.385040283203125, -31.445911407470703, -26.50678253173828, -21.56765365600586, -16.628522872924805, -11.689393043518066, -6.750263214111328, -1.8111343383789062, 3.1279964447021484, 8.067127227783203, 13.006256103515625, 17.945384979248047, 22.8845157623291, 27.823646545410156, 32.76277542114258, 37.701904296875, 42.64103698730469, 47.58016586303711, 52.51929473876953, 57.45842361450195, 62.397552490234375, 67.33668518066406, 72.27581787109375, 77.2149429321289, 82.1540756225586, 87.09320068359375, 92.03233337402344, 96.97146606445312, 101.91059112548828, 106.84972381591797, 111.78884887695312, 116.72798156738281, 121.6671142578125, 126.60624694824219, 131.54537963867188, 136.48451232910156, 141.42364501953125, 146.36276245117188, 151.30189514160156, 156.24102783203125, 161.18016052246094, 166.11929321289062, 171.05841064453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 5.0, 6.0, 9.0, 20.0, 23.0, 28.0, 43.0, 61.0, 109.0, 155.0, 301.0, 585.0, 1219.0, 3088.0, 10257.0, 52852.0, 633515.0, 3037607.0, 405086.0, 36823.0, 7897.0, 2432.0, 989.0, 459.0, 248.0, 167.0, 95.0, 72.0, 42.0, 31.0, 20.0, 13.0, 1.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7265625, -15.1920166015625, -14.657470703125, -14.1229248046875, -13.58837890625, -13.0538330078125, -12.519287109375, -11.9847412109375, -11.4501953125, -10.9156494140625, -10.381103515625, -9.8465576171875, -9.31201171875, -8.7774658203125, -8.242919921875, -7.7083740234375, -7.173828125, -6.6392822265625, -6.104736328125, -5.5701904296875, -5.03564453125, -4.5010986328125, -3.966552734375, -3.4320068359375, -2.8974609375, -2.3629150390625, -1.828369140625, -1.2938232421875, -0.75927734375, -0.2247314453125, 0.309814453125, 0.8443603515625, 1.37890625, 1.9134521484375, 2.447998046875, 2.9825439453125, 3.51708984375, 4.0516357421875, 4.586181640625, 5.1207275390625, 5.6552734375, 6.1898193359375, 6.724365234375, 7.2589111328125, 7.79345703125, 8.3280029296875, 8.862548828125, 9.3970947265625, 9.931640625, 10.4661865234375, 11.000732421875, 11.5352783203125, 12.06982421875, 12.6043701171875, 13.138916015625, 13.6734619140625, 14.2080078125, 14.7425537109375, 15.277099609375, 15.8116455078125, 16.34619140625, 16.8807373046875, 17.415283203125, 17.9498291015625, 18.484375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 10.0, 15.0, 15.0, 18.0, 18.0, 24.0, 34.0, 42.0, 31.0, 32.0, 54.0, 53.0, 60.0, 58.0, 54.0, 66.0, 58.0, 60.0, 44.0, 33.0, 39.0, 29.0, 31.0, 28.0, 21.0, 14.0, 15.0, 9.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.931884765625, -9.58251953125, -9.233154296875, -8.8837890625, -8.534423828125, -8.18505859375, -7.835693359375, -7.486328125, -7.136962890625, -6.78759765625, -6.438232421875, -6.0888671875, -5.739501953125, -5.39013671875, -5.040771484375, -4.69140625, -4.342041015625, -3.99267578125, -3.643310546875, -3.2939453125, -2.944580078125, -2.59521484375, -2.245849609375, -1.896484375, -1.547119140625, -1.19775390625, -0.848388671875, -0.4990234375, -0.149658203125, 0.19970703125, 0.549072265625, 0.8984375, 1.247802734375, 1.59716796875, 1.946533203125, 2.2958984375, 2.645263671875, 2.99462890625, 3.343994140625, 3.693359375, 4.042724609375, 4.39208984375, 4.741455078125, 5.0908203125, 5.440185546875, 5.78955078125, 6.138916015625, 6.48828125, 6.837646484375, 7.18701171875, 7.536376953125, 7.8857421875, 8.235107421875, 8.58447265625, 8.933837890625, 9.283203125, 9.632568359375, 9.98193359375, 10.331298828125, 10.6806640625, 11.030029296875, 11.37939453125, 11.728759765625, 12.078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 13.0, 20.0, 38.0, 84.0, 133.0, 324.0, 785.0, 2243.0, 11666.0, 267467.0, 3831822.0, 70011.0, 6580.0, 1721.0, 688.0, 352.0, 130.0, 88.0, 52.0, 19.0, 8.0, 12.0, 6.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.25, -38.03564453125, -36.8212890625, -35.60693359375, -34.392578125, -33.17822265625, -31.9638671875, -30.74951171875, -29.53515625, -28.32080078125, -27.1064453125, -25.89208984375, -24.677734375, -23.46337890625, -22.2490234375, -21.03466796875, -19.8203125, -18.60595703125, -17.3916015625, -16.17724609375, -14.962890625, -13.74853515625, -12.5341796875, -11.31982421875, -10.10546875, -8.89111328125, -7.6767578125, -6.46240234375, -5.248046875, -4.03369140625, -2.8193359375, -1.60498046875, -0.390625, 0.82373046875, 2.0380859375, 3.25244140625, 4.466796875, 5.68115234375, 6.8955078125, 8.10986328125, 9.32421875, 10.53857421875, 11.7529296875, 12.96728515625, 14.181640625, 15.39599609375, 16.6103515625, 17.82470703125, 19.0390625, 20.25341796875, 21.4677734375, 22.68212890625, 23.896484375, 25.11083984375, 26.3251953125, 27.53955078125, 28.75390625, 29.96826171875, 31.1826171875, 32.39697265625, 33.611328125, 34.82568359375, 36.0400390625, 37.25439453125, 38.46875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 7.0, 11.0, 24.0, 46.0, 89.0, 194.0, 532.0, 1243.0, 1106.0, 433.0, 180.0, 91.0, 43.0, 23.0, 14.0, 18.0, 10.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.0625, -35.86083984375, -34.6591796875, -33.45751953125, -32.255859375, -31.05419921875, -29.8525390625, -28.65087890625, -27.44921875, -26.24755859375, -25.0458984375, -23.84423828125, -22.642578125, -21.44091796875, -20.2392578125, -19.03759765625, -17.8359375, -16.63427734375, -15.4326171875, -14.23095703125, -13.029296875, -11.82763671875, -10.6259765625, -9.42431640625, -8.22265625, -7.02099609375, -5.8193359375, -4.61767578125, -3.416015625, -2.21435546875, -1.0126953125, 0.18896484375, 1.390625, 2.59228515625, 3.7939453125, 4.99560546875, 6.197265625, 7.39892578125, 8.6005859375, 9.80224609375, 11.00390625, 12.20556640625, 13.4072265625, 14.60888671875, 15.810546875, 17.01220703125, 18.2138671875, 19.41552734375, 20.6171875, 21.81884765625, 23.0205078125, 24.22216796875, 25.423828125, 26.62548828125, 27.8271484375, 29.02880859375, 30.23046875, 31.43212890625, 32.6337890625, 33.83544921875, 35.037109375, 36.23876953125, 37.4404296875, 38.64208984375, 39.84375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 13.0, 97.0, 444.0, 353.0, 66.0, 15.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.69464111328125, -219.0989227294922, -200.50320434570312, -181.907470703125, -163.31175231933594, -144.71603393554688, -126.12030792236328, -107.52458190917969, -88.92886352539062, -70.33314514160156, -51.73741912841797, -33.14169692993164, -14.545974731445312, 4.04974365234375, 22.645469665527344, 41.24119567871094, 59.8369140625, 78.43263244628906, 97.02835845947266, 115.62408447265625, 134.2198028564453, 152.81552124023438, 171.4112548828125, 190.00697326660156, 208.60269165039062, 227.1984100341797, 245.79412841796875, 264.3898620605469, 282.985595703125, 301.581298828125, 320.1770324707031, 338.77276611328125, 357.3685302734375, 375.9642639160156, 394.5599670410156, 413.15570068359375, 431.75140380859375, 450.3471374511719, 468.94287109375, 487.53857421875, 506.1343078613281, 524.7300415039062, 543.3257446289062, 561.9214477539062, 580.5172119140625, 599.1129150390625, 617.7086181640625, 636.3043823242188, 654.9000854492188, 673.4957885742188, 692.091552734375, 710.687255859375, 729.282958984375, 747.878662109375, 766.4744262695312, 785.0701293945312, 803.6658935546875, 822.2615966796875, 840.8573608398438, 859.4530639648438, 878.0487670898438, 896.64453125, 915.240234375, 933.8359375, 952.431640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 12.0, 31.0, 34.0, 37.0, 61.0, 68.0, 80.0, 85.0, 85.0, 76.0, 90.0, 73.0, 73.0, 41.0, 37.0, 38.0, 22.0, 17.0, 9.0, 11.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-178.72216796875, -172.99313354492188, -167.26409912109375, -161.53506469726562, -155.8060302734375, -150.07699584960938, -144.34796142578125, -138.61892700195312, -132.889892578125, -127.16085815429688, -121.43182373046875, -115.70278930664062, -109.9737548828125, -104.24472045898438, -98.51567840576172, -92.7866439819336, -87.05760192871094, -81.32856750488281, -75.59953308105469, -69.87049865722656, -64.14146423339844, -58.41242599487305, -52.683387756347656, -46.95435333251953, -41.225318908691406, -35.49628448486328, -29.767248153686523, -24.038211822509766, -18.30917739868164, -12.580142974853516, -6.851104736328125, -1.1220703125, 4.606964111328125, 10.335999488830566, 16.065034866333008, 21.794071197509766, 27.52310562133789, 33.252140045166016, 38.981178283691406, 44.71021270751953, 50.439247131347656, 56.16828155517578, 61.897315979003906, 67.62635803222656, 73.35539245605469, 79.08442687988281, 84.81346130371094, 90.54249572753906, 96.27153015136719, 102.00056457519531, 107.72959899902344, 113.45863342285156, 119.18766784667969, 124.91670227050781, 130.645751953125, 136.37478637695312, 142.10382080078125, 147.83285522460938, 153.5618896484375, 159.29092407226562, 165.01995849609375, 170.74899291992188, 176.47802734375, 182.20706176757812, 187.93609619140625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 3.0, 5.0, 6.0, 13.0, 12.0, 29.0, 31.0, 28.0, 47.0, 64.0, 121.0, 216.0, 361.0, 700.0, 1296.0, 2590.0, 6189.0, 14542.0, 38400.0, 107925.0, 272655.0, 341286.0, 165012.0, 59197.0, 21670.0, 8479.0, 3807.0, 1763.0, 922.0, 491.0, 244.0, 169.0, 103.0, 56.0, 32.0, 28.0, 14.0, 14.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-17.96875, -17.410888671875, -16.85302734375, -16.295166015625, -15.7373046875, -15.179443359375, -14.62158203125, -14.063720703125, -13.505859375, -12.947998046875, -12.39013671875, -11.832275390625, -11.2744140625, -10.716552734375, -10.15869140625, -9.600830078125, -9.04296875, -8.485107421875, -7.92724609375, -7.369384765625, -6.8115234375, -6.253662109375, -5.69580078125, -5.137939453125, -4.580078125, -4.022216796875, -3.46435546875, -2.906494140625, -2.3486328125, -1.790771484375, -1.23291015625, -0.675048828125, -0.1171875, 0.440673828125, 0.99853515625, 1.556396484375, 2.1142578125, 2.672119140625, 3.22998046875, 3.787841796875, 4.345703125, 4.903564453125, 5.46142578125, 6.019287109375, 6.5771484375, 7.135009765625, 7.69287109375, 8.250732421875, 8.80859375, 9.366455078125, 9.92431640625, 10.482177734375, 11.0400390625, 11.597900390625, 12.15576171875, 12.713623046875, 13.271484375, 13.829345703125, 14.38720703125, 14.945068359375, 15.5029296875, 16.060791015625, 16.61865234375, 17.176513671875, 17.734375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 9.0, 5.0, 9.0, 13.0, 12.0, 14.0, 13.0, 24.0, 25.0, 39.0, 28.0, 44.0, 31.0, 44.0, 55.0, 44.0, 49.0, 64.0, 47.0, 52.0, 32.0, 46.0, 43.0, 38.0, 34.0, 35.0, 32.0, 25.0, 24.0, 12.0, 11.0, 13.0, 9.0, 13.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.92236328125, -7.6025390625, -7.28271484375, -6.962890625, -6.64306640625, -6.3232421875, -6.00341796875, -5.68359375, -5.36376953125, -5.0439453125, -4.72412109375, -4.404296875, -4.08447265625, -3.7646484375, -3.44482421875, -3.125, -2.80517578125, -2.4853515625, -2.16552734375, -1.845703125, -1.52587890625, -1.2060546875, -0.88623046875, -0.56640625, -0.24658203125, 0.0732421875, 0.39306640625, 0.712890625, 1.03271484375, 1.3525390625, 1.67236328125, 1.9921875, 2.31201171875, 2.6318359375, 2.95166015625, 3.271484375, 3.59130859375, 3.9111328125, 4.23095703125, 4.55078125, 4.87060546875, 5.1904296875, 5.51025390625, 5.830078125, 6.14990234375, 6.4697265625, 6.78955078125, 7.109375, 7.42919921875, 7.7490234375, 8.06884765625, 8.388671875, 8.70849609375, 9.0283203125, 9.34814453125, 9.66796875, 9.98779296875, 10.3076171875, 10.62744140625, 10.947265625, 11.26708984375, 11.5869140625, 11.90673828125, 12.2265625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 11.0, 13.0, 16.0, 19.0, 29.0, 35.0, 46.0, 59.0, 93.0, 115.0, 199.0, 367.0, 656.0, 1334.0, 3322.0, 9454.0, 32057.0, 122665.0, 542614.0, 244125.0, 63786.0, 17602.0, 5497.0, 2086.0, 1001.0, 517.0, 261.0, 153.0, 121.0, 77.0, 49.0, 45.0, 34.0, 26.0, 18.0, 14.0, 9.0, 8.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.90625, -17.211181640625, -16.51611328125, -15.821044921875, -15.1259765625, -14.430908203125, -13.73583984375, -13.040771484375, -12.345703125, -11.650634765625, -10.95556640625, -10.260498046875, -9.5654296875, -8.870361328125, -8.17529296875, -7.480224609375, -6.78515625, -6.090087890625, -5.39501953125, -4.699951171875, -4.0048828125, -3.309814453125, -2.61474609375, -1.919677734375, -1.224609375, -0.529541015625, 0.16552734375, 0.860595703125, 1.5556640625, 2.250732421875, 2.94580078125, 3.640869140625, 4.3359375, 5.031005859375, 5.72607421875, 6.421142578125, 7.1162109375, 7.811279296875, 8.50634765625, 9.201416015625, 9.896484375, 10.591552734375, 11.28662109375, 11.981689453125, 12.6767578125, 13.371826171875, 14.06689453125, 14.761962890625, 15.45703125, 16.152099609375, 16.84716796875, 17.542236328125, 18.2373046875, 18.932373046875, 19.62744140625, 20.322509765625, 21.017578125, 21.712646484375, 22.40771484375, 23.102783203125, 23.7978515625, 24.492919921875, 25.18798828125, 25.883056640625, 26.578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 9.0, 4.0, 10.0, 6.0, 12.0, 17.0, 18.0, 21.0, 25.0, 40.0, 46.0, 45.0, 36.0, 49.0, 55.0, 65.0, 54.0, 65.0, 46.0, 63.0, 54.0, 51.0, 43.0, 29.0, 27.0, 32.0, 18.0, 14.0, 7.0, 10.0, 12.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.5, -38.29052734375, -37.0810546875, -35.87158203125, -34.662109375, -33.45263671875, -32.2431640625, -31.03369140625, -29.82421875, -28.61474609375, -27.4052734375, -26.19580078125, -24.986328125, -23.77685546875, -22.5673828125, -21.35791015625, -20.1484375, -18.93896484375, -17.7294921875, -16.52001953125, -15.310546875, -14.10107421875, -12.8916015625, -11.68212890625, -10.47265625, -9.26318359375, -8.0537109375, -6.84423828125, -5.634765625, -4.42529296875, -3.2158203125, -2.00634765625, -0.796875, 0.41259765625, 1.6220703125, 2.83154296875, 4.041015625, 5.25048828125, 6.4599609375, 7.66943359375, 8.87890625, 10.08837890625, 11.2978515625, 12.50732421875, 13.716796875, 14.92626953125, 16.1357421875, 17.34521484375, 18.5546875, 19.76416015625, 20.9736328125, 22.18310546875, 23.392578125, 24.60205078125, 25.8115234375, 27.02099609375, 28.23046875, 29.43994140625, 30.6494140625, 31.85888671875, 33.068359375, 34.27783203125, 35.4873046875, 36.69677734375, 37.90625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 8.0, 11.0, 8.0, 26.0, 27.0, 36.0, 76.0, 128.0, 188.0, 353.0, 655.0, 1538.0, 4003.0, 12110.0, 43922.0, 178543.0, 595757.0, 155728.0, 38359.0, 10662.0, 3572.0, 1367.0, 659.0, 328.0, 167.0, 98.0, 64.0, 42.0, 25.0, 15.0, 11.0, 9.0, 11.0, 7.0, 4.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.16473388671875, -5.9622802734375, -5.75982666015625, -5.557373046875, -5.35491943359375, -5.1524658203125, -4.95001220703125, -4.74755859375, -4.54510498046875, -4.3426513671875, -4.14019775390625, -3.937744140625, -3.73529052734375, -3.5328369140625, -3.33038330078125, -3.1279296875, -2.92547607421875, -2.7230224609375, -2.52056884765625, -2.318115234375, -2.11566162109375, -1.9132080078125, -1.71075439453125, -1.50830078125, -1.30584716796875, -1.1033935546875, -0.90093994140625, -0.698486328125, -0.49603271484375, -0.2935791015625, -0.09112548828125, 0.111328125, 0.31378173828125, 0.5162353515625, 0.71868896484375, 0.921142578125, 1.12359619140625, 1.3260498046875, 1.52850341796875, 1.73095703125, 1.93341064453125, 2.1358642578125, 2.33831787109375, 2.540771484375, 2.74322509765625, 2.9456787109375, 3.14813232421875, 3.3505859375, 3.55303955078125, 3.7554931640625, 3.95794677734375, 4.160400390625, 4.36285400390625, 4.5653076171875, 4.76776123046875, 4.97021484375, 5.17266845703125, 5.3751220703125, 5.57757568359375, 5.780029296875, 5.98248291015625, 6.1849365234375, 6.38739013671875, 6.58984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 3.0, 6.0, 2.0, 9.0, 11.0, 23.0, 18.0, 18.0, 39.0, 40.0, 39.0, 60.0, 62.0, 66.0, 68.0, 80.0, 80.0, 68.0, 60.0, 45.0, 43.0, 37.0, 25.0, 20.0, 18.0, 11.0, 15.0, 7.0, 6.0, 4.0, 5.0, 0.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0021209716796875, -0.002062767744064331, -0.002004563808441162, -0.0019463598728179932, -0.0018881559371948242, -0.0018299520015716553, -0.0017717480659484863, -0.0017135441303253174, -0.0016553401947021484, -0.0015971362590789795, -0.0015389323234558105, -0.0014807283878326416, -0.0014225244522094727, -0.0013643205165863037, -0.0013061165809631348, -0.0012479126453399658, -0.0011897087097167969, -0.001131504774093628, -0.001073300838470459, -0.00101509690284729, -0.0009568929672241211, -0.0008986890316009521, -0.0008404850959777832, -0.0007822811603546143, -0.0007240772247314453, -0.0006658732891082764, -0.0006076693534851074, -0.0005494654178619385, -0.0004912614822387695, -0.0004330575466156006, -0.00037485361099243164, -0.0003166496753692627, -0.00025844573974609375, -0.0002002418041229248, -0.00014203786849975586, -8.383393287658691e-05, -2.562999725341797e-05, 3.2573938369750977e-05, 9.077787399291992e-05, 0.00014898180961608887, 0.0002071857452392578, 0.00026538968086242676, 0.0003235936164855957, 0.00038179755210876465, 0.0004400014877319336, 0.0004982054233551025, 0.0005564093589782715, 0.0006146132946014404, 0.0006728172302246094, 0.0007310211658477783, 0.0007892251014709473, 0.0008474290370941162, 0.0009056329727172852, 0.0009638369083404541, 0.001022040843963623, 0.001080244779586792, 0.001138448715209961, 0.0011966526508331299, 0.0012548565864562988, 0.0013130605220794678, 0.0013712644577026367, 0.0014294683933258057, 0.0014876723289489746, 0.0015458762645721436, 0.0016040802001953125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 12.0, 11.0, 16.0, 16.0, 33.0, 41.0, 60.0, 79.0, 127.0, 210.0, 368.0, 637.0, 1270.0, 2914.0, 7684.0, 23761.0, 90688.0, 505349.0, 305546.0, 76759.0, 20792.0, 6778.0, 2710.0, 1167.0, 618.0, 353.0, 177.0, 100.0, 72.0, 80.0, 31.0, 27.0, 14.0, 7.0, 10.0, 8.0, 7.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.48394775390625, -5.2803955078125, -5.07684326171875, -4.873291015625, -4.66973876953125, -4.4661865234375, -4.26263427734375, -4.05908203125, -3.85552978515625, -3.6519775390625, -3.44842529296875, -3.244873046875, -3.04132080078125, -2.8377685546875, -2.63421630859375, -2.4306640625, -2.22711181640625, -2.0235595703125, -1.82000732421875, -1.616455078125, -1.41290283203125, -1.2093505859375, -1.00579833984375, -0.80224609375, -0.59869384765625, -0.3951416015625, -0.19158935546875, 0.011962890625, 0.21551513671875, 0.4190673828125, 0.62261962890625, 0.826171875, 1.02972412109375, 1.2332763671875, 1.43682861328125, 1.640380859375, 1.84393310546875, 2.0474853515625, 2.25103759765625, 2.45458984375, 2.65814208984375, 2.8616943359375, 3.06524658203125, 3.268798828125, 3.47235107421875, 3.6759033203125, 3.87945556640625, 4.0830078125, 4.28656005859375, 4.4901123046875, 4.69366455078125, 4.897216796875, 5.10076904296875, 5.3043212890625, 5.50787353515625, 5.71142578125, 5.91497802734375, 6.1185302734375, 6.32208251953125, 6.525634765625, 6.72918701171875, 6.9327392578125, 7.13629150390625, 7.33984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 5.0, 10.0, 18.0, 6.0, 20.0, 36.0, 40.0, 41.0, 53.0, 78.0, 81.0, 79.0, 107.0, 80.0, 64.0, 68.0, 54.0, 37.0, 33.0, 21.0, 11.0, 17.0, 7.0, 10.0, 5.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.765625, -7.478759765625, -7.19189453125, -6.905029296875, -6.6181640625, -6.331298828125, -6.04443359375, -5.757568359375, -5.470703125, -5.183837890625, -4.89697265625, -4.610107421875, -4.3232421875, -4.036376953125, -3.74951171875, -3.462646484375, -3.17578125, -2.888916015625, -2.60205078125, -2.315185546875, -2.0283203125, -1.741455078125, -1.45458984375, -1.167724609375, -0.880859375, -0.593994140625, -0.30712890625, -0.020263671875, 0.2666015625, 0.553466796875, 0.84033203125, 1.127197265625, 1.4140625, 1.700927734375, 1.98779296875, 2.274658203125, 2.5615234375, 2.848388671875, 3.13525390625, 3.422119140625, 3.708984375, 3.995849609375, 4.28271484375, 4.569580078125, 4.8564453125, 5.143310546875, 5.43017578125, 5.717041015625, 6.00390625, 6.290771484375, 6.57763671875, 6.864501953125, 7.1513671875, 7.438232421875, 7.72509765625, 8.011962890625, 8.298828125, 8.585693359375, 8.87255859375, 9.159423828125, 9.4462890625, 9.733154296875, 10.02001953125, 10.306884765625, 10.59375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 9.0, 24.0, 23.0, 62.0, 135.0, 270.0, 214.0, 109.0, 65.0, 44.0, 17.0, 7.0, 4.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-239.19085693359375, -232.33348083496094, -225.4761199951172, -218.61874389648438, -211.76138305664062, -204.9040069580078, -198.046630859375, -191.18927001953125, -184.33189392089844, -177.47451782226562, -170.61715698242188, -163.75978088378906, -156.90240478515625, -150.0450439453125, -143.1876678466797, -136.33029174804688, -129.47293090820312, -122.61556243896484, -115.75819396972656, -108.90081787109375, -102.04344940185547, -95.18608093261719, -88.32870483398438, -81.4713363647461, -74.61396789550781, -67.75659942626953, -60.899227142333984, -54.04185485839844, -47.184486389160156, -40.327117919921875, -33.46974563598633, -26.61237335205078, -19.7550048828125, -12.897634506225586, -6.040264129638672, 0.8171062469482422, 7.674476623535156, 14.531845092773438, 21.389217376708984, 28.24658966064453, 35.10395812988281, 41.961326599121094, 48.81869888305664, 55.67607116699219, 62.53343963623047, 69.39080810546875, 76.24818420410156, 83.10555267333984, 89.96292114257812, 96.8202896118164, 103.67765808105469, 110.5350341796875, 117.39240264892578, 124.24977111816406, 131.10714721679688, 137.96450805664062, 144.82188415527344, 151.67926025390625, 158.53662109375, 165.3939971923828, 172.25137329101562, 179.10873413085938, 185.9661102294922, 192.823486328125, 199.68084716796875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 3.0, 8.0, 10.0, 16.0, 10.0, 16.0, 14.0, 11.0, 18.0, 29.0, 20.0, 30.0, 32.0, 27.0, 23.0, 40.0, 72.0, 65.0, 78.0, 75.0, 42.0, 48.0, 26.0, 23.0, 31.0, 29.0, 30.0, 19.0, 23.0, 15.0, 18.0, 10.0, 12.0, 13.0, 7.0, 10.0, 7.0, 4.0, 5.0, 5.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-105.348388671875, -101.63978576660156, -97.9311752319336, -94.22256469726562, -90.51396179199219, -86.80535888671875, -83.09674835205078, -79.38813781738281, -75.67953491210938, -71.97093200683594, -68.26232147216797, -64.5537109375, -60.84510803222656, -57.13650131225586, -53.427894592285156, -49.71928787231445, -46.01068115234375, -42.30207443237305, -38.593467712402344, -34.88486099243164, -31.176254272460938, -27.467647552490234, -23.75904083251953, -20.050434112548828, -16.341827392578125, -12.633220672607422, -8.924613952636719, -5.216007232666016, -1.5074005126953125, 2.2012062072753906, 5.909812927246094, 9.618419647216797, 13.3270263671875, 17.035633087158203, 20.744239807128906, 24.45284652709961, 28.161453247070312, 31.870059967041016, 35.57866668701172, 39.28727340698242, 42.995880126953125, 46.70448684692383, 50.41309356689453, 54.121700286865234, 57.83030700683594, 61.53891372680664, 65.24752044677734, 68.95613098144531, 72.66473388671875, 76.37333679199219, 80.08194732666016, 83.79055786132812, 87.49916076660156, 91.207763671875, 94.91637420654297, 98.62498474121094, 102.33358764648438, 106.04219055175781, 109.75080108642578, 113.45941162109375, 117.16801452636719, 120.87661743164062, 124.5852279663086, 128.29383850097656, 132.00244140625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 2.0, 7.0, 9.0, 14.0, 14.0, 22.0, 24.0, 29.0, 68.0, 107.0, 154.0, 257.0, 471.0, 814.0, 1662.0, 4016.0, 11495.0, 46564.0, 341418.0, 2398519.0, 1223662.0, 130384.0, 22628.0, 6739.0, 2550.0, 1216.0, 625.0, 333.0, 170.0, 106.0, 65.0, 37.0, 30.0, 18.0, 13.0, 12.0, 14.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.171875, -13.764404296875, -13.35693359375, -12.949462890625, -12.5419921875, -12.134521484375, -11.72705078125, -11.319580078125, -10.912109375, -10.504638671875, -10.09716796875, -9.689697265625, -9.2822265625, -8.874755859375, -8.46728515625, -8.059814453125, -7.65234375, -7.244873046875, -6.83740234375, -6.429931640625, -6.0224609375, -5.614990234375, -5.20751953125, -4.800048828125, -4.392578125, -3.985107421875, -3.57763671875, -3.170166015625, -2.7626953125, -2.355224609375, -1.94775390625, -1.540283203125, -1.1328125, -0.725341796875, -0.31787109375, 0.089599609375, 0.4970703125, 0.904541015625, 1.31201171875, 1.719482421875, 2.126953125, 2.534423828125, 2.94189453125, 3.349365234375, 3.7568359375, 4.164306640625, 4.57177734375, 4.979248046875, 5.38671875, 5.794189453125, 6.20166015625, 6.609130859375, 7.0166015625, 7.424072265625, 7.83154296875, 8.239013671875, 8.646484375, 9.053955078125, 9.46142578125, 9.868896484375, 10.2763671875, 10.683837890625, 11.09130859375, 11.498779296875, 11.90625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 5.0, 15.0, 11.0, 22.0, 25.0, 31.0, 19.0, 40.0, 45.0, 46.0, 63.0, 44.0, 58.0, 64.0, 58.0, 45.0, 39.0, 49.0, 53.0, 45.0, 32.0, 34.0, 29.0, 29.0, 26.0, 12.0, 16.0, 8.0, 5.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.42724609375, -8.1044921875, -7.78173828125, -7.458984375, -7.13623046875, -6.8134765625, -6.49072265625, -6.16796875, -5.84521484375, -5.5224609375, -5.19970703125, -4.876953125, -4.55419921875, -4.2314453125, -3.90869140625, -3.5859375, -3.26318359375, -2.9404296875, -2.61767578125, -2.294921875, -1.97216796875, -1.6494140625, -1.32666015625, -1.00390625, -0.68115234375, -0.3583984375, -0.03564453125, 0.287109375, 0.60986328125, 0.9326171875, 1.25537109375, 1.578125, 1.90087890625, 2.2236328125, 2.54638671875, 2.869140625, 3.19189453125, 3.5146484375, 3.83740234375, 4.16015625, 4.48291015625, 4.8056640625, 5.12841796875, 5.451171875, 5.77392578125, 6.0966796875, 6.41943359375, 6.7421875, 7.06494140625, 7.3876953125, 7.71044921875, 8.033203125, 8.35595703125, 8.6787109375, 9.00146484375, 9.32421875, 9.64697265625, 9.9697265625, 10.29248046875, 10.615234375, 10.93798828125, 11.2607421875, 11.58349609375, 11.90625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 8.0, 9.0, 17.0, 29.0, 39.0, 96.0, 250.0, 962.0, 5636.0, 127550.0, 3968975.0, 84433.0, 4933.0, 834.0, 267.0, 113.0, 43.0, 23.0, 28.0, 10.0, 9.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.40625, -34.2041015625, -33.001953125, -31.7998046875, -30.59765625, -29.3955078125, -28.193359375, -26.9912109375, -25.7890625, -24.5869140625, -23.384765625, -22.1826171875, -20.98046875, -19.7783203125, -18.576171875, -17.3740234375, -16.171875, -14.9697265625, -13.767578125, -12.5654296875, -11.36328125, -10.1611328125, -8.958984375, -7.7568359375, -6.5546875, -5.3525390625, -4.150390625, -2.9482421875, -1.74609375, -0.5439453125, 0.658203125, 1.8603515625, 3.0625, 4.2646484375, 5.466796875, 6.6689453125, 7.87109375, 9.0732421875, 10.275390625, 11.4775390625, 12.6796875, 13.8818359375, 15.083984375, 16.2861328125, 17.48828125, 18.6904296875, 19.892578125, 21.0947265625, 22.296875, 23.4990234375, 24.701171875, 25.9033203125, 27.10546875, 28.3076171875, 29.509765625, 30.7119140625, 31.9140625, 33.1162109375, 34.318359375, 35.5205078125, 36.72265625, 37.9248046875, 39.126953125, 40.3291015625, 41.53125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 11.0, 10.0, 18.0, 23.0, 20.0, 51.0, 65.0, 105.0, 186.0, 306.0, 411.0, 647.0, 718.0, 557.0, 361.0, 221.0, 124.0, 69.0, 42.0, 40.0, 19.0, 15.0, 8.0, 8.0, 7.0, 7.0, 2.0, 7.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.0859375, -14.4854736328125, -13.885009765625, -13.2845458984375, -12.68408203125, -12.0836181640625, -11.483154296875, -10.8826904296875, -10.2822265625, -9.6817626953125, -9.081298828125, -8.4808349609375, -7.88037109375, -7.2799072265625, -6.679443359375, -6.0789794921875, -5.478515625, -4.8780517578125, -4.277587890625, -3.6771240234375, -3.07666015625, -2.4761962890625, -1.875732421875, -1.2752685546875, -0.6748046875, -0.0743408203125, 0.526123046875, 1.1265869140625, 1.72705078125, 2.3275146484375, 2.927978515625, 3.5284423828125, 4.12890625, 4.7293701171875, 5.329833984375, 5.9302978515625, 6.53076171875, 7.1312255859375, 7.731689453125, 8.3321533203125, 8.9326171875, 9.5330810546875, 10.133544921875, 10.7340087890625, 11.33447265625, 11.9349365234375, 12.535400390625, 13.1358642578125, 13.736328125, 14.3367919921875, 14.937255859375, 15.5377197265625, 16.13818359375, 16.7386474609375, 17.339111328125, 17.9395751953125, 18.5400390625, 19.1405029296875, 19.740966796875, 20.3414306640625, 20.94189453125, 21.5423583984375, 22.142822265625, 22.7432861328125, 23.34375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 15.0, 51.0, 222.0, 417.0, 215.0, 63.0, 11.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.3690185546875, -181.60992431640625, -169.850830078125, -158.0917510986328, -146.33265686035156, -134.5735626220703, -122.8144760131836, -111.05538940429688, -99.29629516601562, -87.53720092773438, -75.77811431884766, -64.01902770996094, -52.25993347167969, -40.5008430480957, -28.74175262451172, -16.982666015625, -5.22357177734375, 6.535518646240234, 18.29460906982422, 30.053699493408203, 41.81278991699219, 53.57188034057617, 65.33097076416016, 77.09005737304688, 88.84915161132812, 100.60824584960938, 112.3673324584961, 124.12641906738281, 135.88551330566406, 147.6446075439453, 159.4036865234375, 171.16278076171875, 182.921875, 194.68096923828125, 206.4400634765625, 218.1991424560547, 229.95823669433594, 241.7173309326172, 253.47640991210938, 265.2355041503906, 276.9945983886719, 288.7536926269531, 300.5127868652344, 312.2718811035156, 324.03094482421875, 335.7900390625, 347.54913330078125, 359.3082275390625, 371.06732177734375, 382.826416015625, 394.58551025390625, 406.3446044921875, 418.10369873046875, 429.8627624511719, 441.6218566894531, 453.3809509277344, 465.1400451660156, 476.8991394042969, 488.6582336425781, 500.4173278808594, 512.1763916015625, 523.9354858398438, 535.694580078125, 547.4536743164062, 559.2127685546875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 6.0, 7.0, 8.0, 19.0, 15.0, 20.0, 16.0, 20.0, 27.0, 35.0, 38.0, 38.0, 51.0, 50.0, 44.0, 51.0, 56.0, 54.0, 44.0, 52.0, 46.0, 36.0, 45.0, 44.0, 33.0, 26.0, 22.0, 27.0, 10.0, 14.0, 7.0, 6.0, 2.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-96.74711608886719, -93.80732727050781, -90.86753845214844, -87.92774963378906, -84.98795318603516, -82.04816436767578, -79.1083755493164, -76.16858673095703, -73.22879791259766, -70.28900909423828, -67.3492202758789, -64.409423828125, -61.46963882446289, -58.52984619140625, -55.590057373046875, -52.6502685546875, -49.71047592163086, -46.770687103271484, -43.830894470214844, -40.89110565185547, -37.951316833496094, -35.01152801513672, -32.07173538208008, -29.131946563720703, -26.192155838012695, -23.252365112304688, -20.312576293945312, -17.372785568237305, -14.432995796203613, -11.493206024169922, -8.553415298461914, -5.613626480102539, -2.6738357543945312, 0.26595425605773926, 3.2057442665100098, 6.145534515380859, 9.08532428741455, 12.025114059448242, 14.96490478515625, 17.904693603515625, 20.844484329223633, 23.78427505493164, 26.724063873291016, 29.663854598999023, 32.60364532470703, 35.543434143066406, 38.48322296142578, 41.423011779785156, 44.3628044128418, 47.30259323120117, 50.24238586425781, 53.18217468261719, 56.12196350097656, 59.06175231933594, 62.00154495239258, 64.94132995605469, 67.8811264038086, 70.82091522216797, 73.76070404052734, 76.70050048828125, 79.64028930664062, 82.580078125, 85.51986694335938, 88.45965576171875, 91.39944458007812]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 8.0, 10.0, 13.0, 11.0, 22.0, 35.0, 53.0, 107.0, 201.0, 293.0, 593.0, 1214.0, 2759.0, 6623.0, 16981.0, 47432.0, 139351.0, 344790.0, 307695.0, 116535.0, 39299.0, 14332.0, 5553.0, 2277.0, 1090.0, 527.0, 321.0, 172.0, 78.0, 62.0, 32.0, 23.0, 21.0, 14.0, 11.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.546875, -19.017333984375, -18.48779296875, -17.958251953125, -17.4287109375, -16.899169921875, -16.36962890625, -15.840087890625, -15.310546875, -14.781005859375, -14.25146484375, -13.721923828125, -13.1923828125, -12.662841796875, -12.13330078125, -11.603759765625, -11.07421875, -10.544677734375, -10.01513671875, -9.485595703125, -8.9560546875, -8.426513671875, -7.89697265625, -7.367431640625, -6.837890625, -6.308349609375, -5.77880859375, -5.249267578125, -4.7197265625, -4.190185546875, -3.66064453125, -3.131103515625, -2.6015625, -2.072021484375, -1.54248046875, -1.012939453125, -0.4833984375, 0.046142578125, 0.57568359375, 1.105224609375, 1.634765625, 2.164306640625, 2.69384765625, 3.223388671875, 3.7529296875, 4.282470703125, 4.81201171875, 5.341552734375, 5.87109375, 6.400634765625, 6.93017578125, 7.459716796875, 7.9892578125, 8.518798828125, 9.04833984375, 9.577880859375, 10.107421875, 10.636962890625, 11.16650390625, 11.696044921875, 12.2255859375, 12.755126953125, 13.28466796875, 13.814208984375, 14.34375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 6.0, 11.0, 7.0, 17.0, 26.0, 31.0, 23.0, 28.0, 40.0, 36.0, 51.0, 53.0, 41.0, 59.0, 47.0, 55.0, 42.0, 40.0, 56.0, 37.0, 53.0, 39.0, 30.0, 34.0, 30.0, 25.0, 14.0, 14.0, 10.0, 4.0, 11.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.92041015625, -7.6064453125, -7.29248046875, -6.978515625, -6.66455078125, -6.3505859375, -6.03662109375, -5.72265625, -5.40869140625, -5.0947265625, -4.78076171875, -4.466796875, -4.15283203125, -3.8388671875, -3.52490234375, -3.2109375, -2.89697265625, -2.5830078125, -2.26904296875, -1.955078125, -1.64111328125, -1.3271484375, -1.01318359375, -0.69921875, -0.38525390625, -0.0712890625, 0.24267578125, 0.556640625, 0.87060546875, 1.1845703125, 1.49853515625, 1.8125, 2.12646484375, 2.4404296875, 2.75439453125, 3.068359375, 3.38232421875, 3.6962890625, 4.01025390625, 4.32421875, 4.63818359375, 4.9521484375, 5.26611328125, 5.580078125, 5.89404296875, 6.2080078125, 6.52197265625, 6.8359375, 7.14990234375, 7.4638671875, 7.77783203125, 8.091796875, 8.40576171875, 8.7197265625, 9.03369140625, 9.34765625, 9.66162109375, 9.9755859375, 10.28955078125, 10.603515625, 10.91748046875, 11.2314453125, 11.54541015625, 11.859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 6.0, 3.0, 10.0, 11.0, 19.0, 26.0, 44.0, 42.0, 62.0, 94.0, 168.0, 238.0, 377.0, 673.0, 1316.0, 3671.0, 14823.0, 92687.0, 711749.0, 186403.0, 26377.0, 5765.0, 1858.0, 849.0, 434.0, 284.0, 165.0, 116.0, 85.0, 59.0, 36.0, 28.0, 14.0, 17.0, 14.0, 13.0, 6.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.1875, -29.263427734375, -28.33935546875, -27.415283203125, -26.4912109375, -25.567138671875, -24.64306640625, -23.718994140625, -22.794921875, -21.870849609375, -20.94677734375, -20.022705078125, -19.0986328125, -18.174560546875, -17.25048828125, -16.326416015625, -15.40234375, -14.478271484375, -13.55419921875, -12.630126953125, -11.7060546875, -10.781982421875, -9.85791015625, -8.933837890625, -8.009765625, -7.085693359375, -6.16162109375, -5.237548828125, -4.3134765625, -3.389404296875, -2.46533203125, -1.541259765625, -0.6171875, 0.306884765625, 1.23095703125, 2.155029296875, 3.0791015625, 4.003173828125, 4.92724609375, 5.851318359375, 6.775390625, 7.699462890625, 8.62353515625, 9.547607421875, 10.4716796875, 11.395751953125, 12.31982421875, 13.243896484375, 14.16796875, 15.092041015625, 16.01611328125, 16.940185546875, 17.8642578125, 18.788330078125, 19.71240234375, 20.636474609375, 21.560546875, 22.484619140625, 23.40869140625, 24.332763671875, 25.2568359375, 26.180908203125, 27.10498046875, 28.029052734375, 28.953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 8.0, 11.0, 16.0, 16.0, 24.0, 13.0, 28.0, 29.0, 34.0, 40.0, 40.0, 43.0, 59.0, 55.0, 67.0, 65.0, 41.0, 50.0, 55.0, 35.0, 34.0, 34.0, 28.0, 32.0, 30.0, 17.0, 23.0, 18.0, 9.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-36.34375, -35.26953125, -34.1953125, -33.12109375, -32.046875, -30.97265625, -29.8984375, -28.82421875, -27.75, -26.67578125, -25.6015625, -24.52734375, -23.453125, -22.37890625, -21.3046875, -20.23046875, -19.15625, -18.08203125, -17.0078125, -15.93359375, -14.859375, -13.78515625, -12.7109375, -11.63671875, -10.5625, -9.48828125, -8.4140625, -7.33984375, -6.265625, -5.19140625, -4.1171875, -3.04296875, -1.96875, -0.89453125, 0.1796875, 1.25390625, 2.328125, 3.40234375, 4.4765625, 5.55078125, 6.625, 7.69921875, 8.7734375, 9.84765625, 10.921875, 11.99609375, 13.0703125, 14.14453125, 15.21875, 16.29296875, 17.3671875, 18.44140625, 19.515625, 20.58984375, 21.6640625, 22.73828125, 23.8125, 24.88671875, 25.9609375, 27.03515625, 28.109375, 29.18359375, 30.2578125, 31.33203125, 32.40625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 3.0, 11.0, 12.0, 19.0, 20.0, 53.0, 63.0, 91.0, 179.0, 321.0, 702.0, 1759.0, 4841.0, 18282.0, 94881.0, 747856.0, 144577.0, 24746.0, 6233.0, 2149.0, 866.0, 361.0, 196.0, 126.0, 55.0, 40.0, 31.0, 25.0, 15.0, 9.0, 6.0, 4.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.07080078125, -8.7744140625, -8.47802734375, -8.181640625, -7.88525390625, -7.5888671875, -7.29248046875, -6.99609375, -6.69970703125, -6.4033203125, -6.10693359375, -5.810546875, -5.51416015625, -5.2177734375, -4.92138671875, -4.625, -4.32861328125, -4.0322265625, -3.73583984375, -3.439453125, -3.14306640625, -2.8466796875, -2.55029296875, -2.25390625, -1.95751953125, -1.6611328125, -1.36474609375, -1.068359375, -0.77197265625, -0.4755859375, -0.17919921875, 0.1171875, 0.41357421875, 0.7099609375, 1.00634765625, 1.302734375, 1.59912109375, 1.8955078125, 2.19189453125, 2.48828125, 2.78466796875, 3.0810546875, 3.37744140625, 3.673828125, 3.97021484375, 4.2666015625, 4.56298828125, 4.859375, 5.15576171875, 5.4521484375, 5.74853515625, 6.044921875, 6.34130859375, 6.6376953125, 6.93408203125, 7.23046875, 7.52685546875, 7.8232421875, 8.11962890625, 8.416015625, 8.71240234375, 9.0087890625, 9.30517578125, 9.6015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 14.0, 11.0, 8.0, 25.0, 31.0, 35.0, 57.0, 88.0, 91.0, 139.0, 131.0, 92.0, 80.0, 52.0, 40.0, 23.0, 17.0, 17.0, 14.0, 11.0, 6.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031604766845703125, -0.0030676722526550293, -0.002974867820739746, -0.002882063388824463, -0.0027892589569091797, -0.0026964545249938965, -0.0026036500930786133, -0.00251084566116333, -0.002418041229248047, -0.0023252367973327637, -0.0022324323654174805, -0.0021396279335021973, -0.002046823501586914, -0.001954019069671631, -0.0018612146377563477, -0.0017684102058410645, -0.0016756057739257812, -0.001582801342010498, -0.0014899969100952148, -0.0013971924781799316, -0.0013043880462646484, -0.0012115836143493652, -0.001118779182434082, -0.0010259747505187988, -0.0009331703186035156, -0.0008403658866882324, -0.0007475614547729492, -0.000654757022857666, -0.0005619525909423828, -0.0004691481590270996, -0.0003763437271118164, -0.0002835392951965332, -0.00019073486328125, -9.79304313659668e-05, -5.125999450683594e-06, 8.767843246459961e-05, 0.0001804828643798828, 0.000273287296295166, 0.0003660917282104492, 0.0004588961601257324, 0.0005517005920410156, 0.0006445050239562988, 0.000737309455871582, 0.0008301138877868652, 0.0009229183197021484, 0.0010157227516174316, 0.0011085271835327148, 0.001201331615447998, 0.0012941360473632812, 0.0013869404792785645, 0.0014797449111938477, 0.0015725493431091309, 0.001665353775024414, 0.0017581582069396973, 0.0018509626388549805, 0.0019437670707702637, 0.002036571502685547, 0.00212937593460083, 0.0022221803665161133, 0.0023149847984313965, 0.0024077892303466797, 0.002500593662261963, 0.002593398094177246, 0.0026862025260925293, 0.0027790069580078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 8.0, 6.0, 11.0, 18.0, 34.0, 54.0, 115.0, 176.0, 365.0, 983.0, 3104.0, 15342.0, 179609.0, 795096.0, 44550.0, 6291.0, 1643.0, 584.0, 243.0, 137.0, 63.0, 52.0, 18.0, 15.0, 7.0, 4.0, 9.0, 3.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.453125, -12.0545654296875, -11.656005859375, -11.2574462890625, -10.85888671875, -10.4603271484375, -10.061767578125, -9.6632080078125, -9.2646484375, -8.8660888671875, -8.467529296875, -8.0689697265625, -7.67041015625, -7.2718505859375, -6.873291015625, -6.4747314453125, -6.076171875, -5.6776123046875, -5.279052734375, -4.8804931640625, -4.48193359375, -4.0833740234375, -3.684814453125, -3.2862548828125, -2.8876953125, -2.4891357421875, -2.090576171875, -1.6920166015625, -1.29345703125, -0.8948974609375, -0.496337890625, -0.0977783203125, 0.30078125, 0.6993408203125, 1.097900390625, 1.4964599609375, 1.89501953125, 2.2935791015625, 2.692138671875, 3.0906982421875, 3.4892578125, 3.8878173828125, 4.286376953125, 4.6849365234375, 5.08349609375, 5.4820556640625, 5.880615234375, 6.2791748046875, 6.677734375, 7.0762939453125, 7.474853515625, 7.8734130859375, 8.27197265625, 8.6705322265625, 9.069091796875, 9.4676513671875, 9.8662109375, 10.2647705078125, 10.663330078125, 11.0618896484375, 11.46044921875, 11.8590087890625, 12.257568359375, 12.6561279296875, 13.0546875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 4.0, 9.0, 10.0, 12.0, 14.0, 11.0, 22.0, 19.0, 33.0, 43.0, 76.0, 82.0, 91.0, 79.0, 103.0, 81.0, 55.0, 65.0, 49.0, 26.0, 26.0, 20.0, 16.0, 8.0, 11.0, 2.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53125, -6.2720947265625, -6.012939453125, -5.7537841796875, -5.49462890625, -5.2354736328125, -4.976318359375, -4.7171630859375, -4.4580078125, -4.1988525390625, -3.939697265625, -3.6805419921875, -3.42138671875, -3.1622314453125, -2.903076171875, -2.6439208984375, -2.384765625, -2.1256103515625, -1.866455078125, -1.6072998046875, -1.34814453125, -1.0889892578125, -0.829833984375, -0.5706787109375, -0.3115234375, -0.0523681640625, 0.206787109375, 0.4659423828125, 0.72509765625, 0.9842529296875, 1.243408203125, 1.5025634765625, 1.76171875, 2.0208740234375, 2.280029296875, 2.5391845703125, 2.79833984375, 3.0574951171875, 3.316650390625, 3.5758056640625, 3.8349609375, 4.0941162109375, 4.353271484375, 4.6124267578125, 4.87158203125, 5.1307373046875, 5.389892578125, 5.6490478515625, 5.908203125, 6.1673583984375, 6.426513671875, 6.6856689453125, 6.94482421875, 7.2039794921875, 7.463134765625, 7.7222900390625, 7.9814453125, 8.2406005859375, 8.499755859375, 8.7589111328125, 9.01806640625, 9.2772216796875, 9.536376953125, 9.7955322265625, 10.0546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 6.0, 10.0, 25.0, 29.0, 49.0, 80.0, 104.0, 207.0, 211.0, 84.0, 75.0, 39.0, 19.0, 20.0, 6.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.8946533203125, -171.97991943359375, -167.06517028808594, -162.15042114257812, -157.23568725585938, -152.32095336914062, -147.4062042236328, -142.491455078125, -137.57672119140625, -132.6619873046875, -127.74723815917969, -122.8324966430664, -117.91775512695312, -113.00301361083984, -108.08827209472656, -103.17353057861328, -98.2587890625, -93.34404754638672, -88.42930603027344, -83.51456451416016, -78.59982299804688, -73.6850814819336, -68.77033996582031, -63.85559844970703, -58.94085693359375, -54.02611541748047, -49.11137390136719, -44.196632385253906, -39.281890869140625, -34.367149353027344, -29.452407836914062, -24.53766632080078, -19.6229248046875, -14.708183288574219, -9.793441772460938, -4.878700256347656, 0.036041259765625, 4.950782775878906, 9.865524291992188, 14.780265808105469, 19.69500732421875, 24.60974884033203, 29.524490356445312, 34.439231872558594, 39.353973388671875, 44.268714904785156, 49.18345642089844, 54.09819793701172, 59.012939453125, 63.92768096923828, 68.84242248535156, 73.75716400146484, 78.67190551757812, 83.5866470336914, 88.50138854980469, 93.41613006591797, 98.33087158203125, 103.24561309814453, 108.16035461425781, 113.0750961303711, 117.98983764648438, 122.90457916259766, 127.81932067871094, 132.73406982421875, 137.6488037109375]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 12.0, 9.0, 6.0, 12.0, 10.0, 17.0, 14.0, 15.0, 10.0, 27.0, 19.0, 34.0, 37.0, 32.0, 30.0, 40.0, 62.0, 85.0, 86.0, 70.0, 41.0, 33.0, 32.0, 30.0, 23.0, 28.0, 25.0, 24.0, 17.0, 14.0, 9.0, 12.0, 10.0, 19.0, 7.0, 9.0, 4.0, 5.0, 6.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0], "bins": [-126.7812728881836, -123.16165924072266, -119.54205322265625, -115.92243957519531, -112.30282592773438, -108.68321990966797, -105.06360626220703, -101.44400024414062, -97.82438659667969, -94.20477294921875, -90.58516693115234, -86.9655532836914, -83.345947265625, -79.72633361816406, -76.10671997070312, -72.48710632324219, -68.86750030517578, -65.24788665771484, -61.62828063964844, -58.0086669921875, -54.38905715942383, -50.769447326660156, -47.14983367919922, -43.53022384643555, -39.910614013671875, -36.2910041809082, -32.67139434814453, -29.051780700683594, -25.432170867919922, -21.81256103515625, -18.192949295043945, -14.57333755493164, -10.953727722167969, -7.3341169357299805, -3.714506149291992, -0.0948953628540039, 3.5247154235839844, 7.144325256347656, 10.763936996459961, 14.383548736572266, 18.003158569335938, 21.62276840209961, 25.242380142211914, 28.86199188232422, 32.48160171508789, 36.10121154785156, 39.7208251953125, 43.34043502807617, 46.960044860839844, 50.579654693603516, 54.19926452636719, 57.818878173828125, 61.4384880065918, 65.05809783935547, 68.6777114868164, 72.29731750488281, 75.91693115234375, 79.53654479980469, 83.1561508178711, 86.77576446533203, 90.39537048339844, 94.01498413085938, 97.63459777832031, 101.25421142578125, 104.87381744384766]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 9.0, 12.0, 13.0, 10.0, 28.0, 44.0, 91.0, 125.0, 300.0, 601.0, 1433.0, 3915.0, 14236.0, 82451.0, 832472.0, 2692426.0, 498595.0, 52199.0, 10089.0, 3047.0, 1151.0, 487.0, 261.0, 122.0, 53.0, 42.0, 27.0, 7.0, 9.0, 6.0, 6.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5546875, -13.0772705078125, -12.599853515625, -12.1224365234375, -11.64501953125, -11.1676025390625, -10.690185546875, -10.2127685546875, -9.7353515625, -9.2579345703125, -8.780517578125, -8.3031005859375, -7.82568359375, -7.3482666015625, -6.870849609375, -6.3934326171875, -5.916015625, -5.4385986328125, -4.961181640625, -4.4837646484375, -4.00634765625, -3.5289306640625, -3.051513671875, -2.5740966796875, -2.0966796875, -1.6192626953125, -1.141845703125, -0.6644287109375, -0.18701171875, 0.2904052734375, 0.767822265625, 1.2452392578125, 1.72265625, 2.2000732421875, 2.677490234375, 3.1549072265625, 3.63232421875, 4.1097412109375, 4.587158203125, 5.0645751953125, 5.5419921875, 6.0194091796875, 6.496826171875, 6.9742431640625, 7.45166015625, 7.9290771484375, 8.406494140625, 8.8839111328125, 9.361328125, 9.8387451171875, 10.316162109375, 10.7935791015625, 11.27099609375, 11.7484130859375, 12.225830078125, 12.7032470703125, 13.1806640625, 13.6580810546875, 14.135498046875, 14.6129150390625, 15.09033203125, 15.5677490234375, 16.045166015625, 16.5225830078125, 17.0]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 5.0, 15.0, 9.0, 17.0, 20.0, 21.0, 36.0, 24.0, 37.0, 41.0, 40.0, 49.0, 50.0, 51.0, 53.0, 59.0, 45.0, 47.0, 54.0, 37.0, 43.0, 39.0, 37.0, 33.0, 22.0, 27.0, 30.0, 12.0, 12.0, 11.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.40625, -8.101318359375, -7.79638671875, -7.491455078125, -7.1865234375, -6.881591796875, -6.57666015625, -6.271728515625, -5.966796875, -5.661865234375, -5.35693359375, -5.052001953125, -4.7470703125, -4.442138671875, -4.13720703125, -3.832275390625, -3.52734375, -3.222412109375, -2.91748046875, -2.612548828125, -2.3076171875, -2.002685546875, -1.69775390625, -1.392822265625, -1.087890625, -0.782958984375, -0.47802734375, -0.173095703125, 0.1318359375, 0.436767578125, 0.74169921875, 1.046630859375, 1.3515625, 1.656494140625, 1.96142578125, 2.266357421875, 2.5712890625, 2.876220703125, 3.18115234375, 3.486083984375, 3.791015625, 4.095947265625, 4.40087890625, 4.705810546875, 5.0107421875, 5.315673828125, 5.62060546875, 5.925537109375, 6.23046875, 6.535400390625, 6.84033203125, 7.145263671875, 7.4501953125, 7.755126953125, 8.06005859375, 8.364990234375, 8.669921875, 8.974853515625, 9.27978515625, 9.584716796875, 9.8896484375, 10.194580078125, 10.49951171875, 10.804443359375, 11.109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 7.0, 14.0, 23.0, 25.0, 61.0, 104.0, 209.0, 538.0, 1659.0, 15120.0, 1618338.0, 2536658.0, 18660.0, 1913.0, 528.0, 200.0, 104.0, 46.0, 35.0, 13.0, 16.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.34375, -36.140625, -34.9375, -33.734375, -32.53125, -31.328125, -30.125, -28.921875, -27.71875, -26.515625, -25.3125, -24.109375, -22.90625, -21.703125, -20.5, -19.296875, -18.09375, -16.890625, -15.6875, -14.484375, -13.28125, -12.078125, -10.875, -9.671875, -8.46875, -7.265625, -6.0625, -4.859375, -3.65625, -2.453125, -1.25, -0.046875, 1.15625, 2.359375, 3.5625, 4.765625, 5.96875, 7.171875, 8.375, 9.578125, 10.78125, 11.984375, 13.1875, 14.390625, 15.59375, 16.796875, 18.0, 19.203125, 20.40625, 21.609375, 22.8125, 24.015625, 25.21875, 26.421875, 27.625, 28.828125, 30.03125, 31.234375, 32.4375, 33.640625, 34.84375, 36.046875, 37.25, 38.453125, 39.65625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 25.0, 12.0, 39.0, 80.0, 123.0, 194.0, 329.0, 580.0, 783.0, 778.0, 464.0, 279.0, 156.0, 82.0, 51.0, 31.0, 21.0, 8.0, 7.0, 10.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.296875, -25.470703125, -24.64453125, -23.818359375, -22.9921875, -22.166015625, -21.33984375, -20.513671875, -19.6875, -18.861328125, -18.03515625, -17.208984375, -16.3828125, -15.556640625, -14.73046875, -13.904296875, -13.078125, -12.251953125, -11.42578125, -10.599609375, -9.7734375, -8.947265625, -8.12109375, -7.294921875, -6.46875, -5.642578125, -4.81640625, -3.990234375, -3.1640625, -2.337890625, -1.51171875, -0.685546875, 0.140625, 0.966796875, 1.79296875, 2.619140625, 3.4453125, 4.271484375, 5.09765625, 5.923828125, 6.75, 7.576171875, 8.40234375, 9.228515625, 10.0546875, 10.880859375, 11.70703125, 12.533203125, 13.359375, 14.185546875, 15.01171875, 15.837890625, 16.6640625, 17.490234375, 18.31640625, 19.142578125, 19.96875, 20.794921875, 21.62109375, 22.447265625, 23.2734375, 24.099609375, 24.92578125, 25.751953125, 26.578125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 8.0, 14.0, 27.0, 33.0, 70.0, 127.0, 183.0, 209.0, 153.0, 89.0, 42.0, 18.0, 13.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-245.51455688476562, -239.55516052246094, -233.5957794189453, -227.63638305664062, -221.677001953125, -215.7176055908203, -209.75820922851562, -203.798828125, -197.8394317626953, -191.88003540039062, -185.920654296875, -179.9612579345703, -174.00186157226562, -168.04248046875, -162.0830841064453, -156.12368774414062, -150.164306640625, -144.2049102783203, -138.2455291748047, -132.2861328125, -126.32674407958984, -120.36735534667969, -114.407958984375, -108.44857025146484, -102.48918151855469, -96.52979278564453, -90.57040405273438, -84.61100769042969, -78.65161895751953, -72.69223022460938, -66.73283386230469, -60.77344512939453, -54.81404113769531, -48.854652404785156, -42.895259857177734, -36.93586730957031, -30.976478576660156, -25.017087936401367, -19.057697296142578, -13.098304748535156, -7.138916015625, -1.179525375366211, 4.779865264892578, 10.739255905151367, 16.698646545410156, 22.658037185668945, 28.617427825927734, 34.576820373535156, 40.53620910644531, 46.49559783935547, 52.45499038696289, 58.41438293457031, 64.37377166748047, 70.33316040039062, 76.29255676269531, 82.25194549560547, 88.21133422851562, 94.17072296142578, 100.13011169433594, 106.08950805664062, 112.04889678955078, 118.00828552246094, 123.96768188476562, 129.92706298828125, 135.88645935058594]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 10.0, 7.0, 8.0, 9.0, 7.0, 8.0, 10.0, 17.0, 16.0, 18.0, 25.0, 29.0, 32.0, 23.0, 37.0, 38.0, 46.0, 37.0, 42.0, 57.0, 46.0, 59.0, 42.0, 41.0, 39.0, 33.0, 39.0, 24.0, 27.0, 28.0, 28.0, 15.0, 13.0, 12.0, 19.0, 9.0, 3.0, 9.0, 10.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.25106811523438, -74.7386703491211, -72.22626495361328, -69.7138671875, -67.20146942138672, -64.68907165527344, -62.176666259765625, -59.664268493652344, -57.1518669128418, -54.63946533203125, -52.12706756591797, -49.61466598510742, -47.102264404296875, -44.589866638183594, -42.07746505737305, -39.5650634765625, -37.05266571044922, -34.54026412963867, -32.02786636352539, -29.515464782714844, -27.00306510925293, -24.490665435791016, -21.97826385498047, -19.465864181518555, -16.95346450805664, -14.441064834594727, -11.928664207458496, -9.416263580322266, -6.903863906860352, -4.3914642333984375, -1.879063606262207, 0.6333370208740234, 3.1457366943359375, 5.65813684463501, 8.170536994934082, 10.682937622070312, 13.195337295532227, 15.70773696899414, 18.220138549804688, 20.7325382232666, 23.244937896728516, 25.75733757019043, 28.269737243652344, 30.78213882446289, 33.29454040527344, 35.80693817138672, 38.319339752197266, 40.83174133300781, 43.344139099121094, 45.85654067993164, 48.36893844604492, 50.88134002685547, 53.39373779296875, 55.9061393737793, 58.418540954589844, 60.930938720703125, 63.44334030151367, 65.95574188232422, 68.4681396484375, 70.98053741455078, 73.4929428100586, 76.00534057617188, 78.51773834228516, 81.03014373779297, 83.54254150390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 11.0, 10.0, 9.0, 17.0, 37.0, 51.0, 71.0, 144.0, 229.0, 394.0, 828.0, 1588.0, 3370.0, 7629.0, 18632.0, 48696.0, 142988.0, 374791.0, 290977.0, 98418.0, 34915.0, 13662.0, 5752.0, 2697.0, 1226.0, 638.0, 343.0, 156.0, 109.0, 55.0, 36.0, 30.0, 21.0, 12.0, 6.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.765625, -13.18798828125, -12.6103515625, -12.03271484375, -11.455078125, -10.87744140625, -10.2998046875, -9.72216796875, -9.14453125, -8.56689453125, -7.9892578125, -7.41162109375, -6.833984375, -6.25634765625, -5.6787109375, -5.10107421875, -4.5234375, -3.94580078125, -3.3681640625, -2.79052734375, -2.212890625, -1.63525390625, -1.0576171875, -0.47998046875, 0.09765625, 0.67529296875, 1.2529296875, 1.83056640625, 2.408203125, 2.98583984375, 3.5634765625, 4.14111328125, 4.71875, 5.29638671875, 5.8740234375, 6.45166015625, 7.029296875, 7.60693359375, 8.1845703125, 8.76220703125, 9.33984375, 9.91748046875, 10.4951171875, 11.07275390625, 11.650390625, 12.22802734375, 12.8056640625, 13.38330078125, 13.9609375, 14.53857421875, 15.1162109375, 15.69384765625, 16.271484375, 16.84912109375, 17.4267578125, 18.00439453125, 18.58203125, 19.15966796875, 19.7373046875, 20.31494140625, 20.892578125, 21.47021484375, 22.0478515625, 22.62548828125, 23.203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 4.0, 11.0, 6.0, 14.0, 21.0, 20.0, 24.0, 35.0, 29.0, 32.0, 50.0, 42.0, 58.0, 55.0, 44.0, 57.0, 49.0, 47.0, 51.0, 46.0, 46.0, 41.0, 41.0, 29.0, 34.0, 23.0, 20.0, 16.0, 10.0, 11.0, 6.0, 4.0, 5.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6015625, -9.2796630859375, -8.957763671875, -8.6358642578125, -8.31396484375, -7.9920654296875, -7.670166015625, -7.3482666015625, -7.0263671875, -6.7044677734375, -6.382568359375, -6.0606689453125, -5.73876953125, -5.4168701171875, -5.094970703125, -4.7730712890625, -4.451171875, -4.1292724609375, -3.807373046875, -3.4854736328125, -3.16357421875, -2.8416748046875, -2.519775390625, -2.1978759765625, -1.8759765625, -1.5540771484375, -1.232177734375, -0.9102783203125, -0.58837890625, -0.2664794921875, 0.055419921875, 0.3773193359375, 0.69921875, 1.0211181640625, 1.343017578125, 1.6649169921875, 1.98681640625, 2.3087158203125, 2.630615234375, 2.9525146484375, 3.2744140625, 3.5963134765625, 3.918212890625, 4.2401123046875, 4.56201171875, 4.8839111328125, 5.205810546875, 5.5277099609375, 5.849609375, 6.1715087890625, 6.493408203125, 6.8153076171875, 7.13720703125, 7.4591064453125, 7.781005859375, 8.1029052734375, 8.4248046875, 8.7467041015625, 9.068603515625, 9.3905029296875, 9.71240234375, 10.0343017578125, 10.356201171875, 10.6781005859375, 11.0]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 12.0, 14.0, 23.0, 27.0, 34.0, 39.0, 58.0, 78.0, 116.0, 158.0, 235.0, 348.0, 555.0, 965.0, 1898.0, 5513.0, 26097.0, 243541.0, 709300.0, 46050.0, 7935.0, 2547.0, 1139.0, 646.0, 382.0, 254.0, 183.0, 110.0, 74.0, 66.0, 48.0, 24.0, 21.0, 19.0, 9.0, 14.0, 2.0, 3.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.96875, -26.9384765625, -25.908203125, -24.8779296875, -23.84765625, -22.8173828125, -21.787109375, -20.7568359375, -19.7265625, -18.6962890625, -17.666015625, -16.6357421875, -15.60546875, -14.5751953125, -13.544921875, -12.5146484375, -11.484375, -10.4541015625, -9.423828125, -8.3935546875, -7.36328125, -6.3330078125, -5.302734375, -4.2724609375, -3.2421875, -2.2119140625, -1.181640625, -0.1513671875, 0.87890625, 1.9091796875, 2.939453125, 3.9697265625, 5.0, 6.0302734375, 7.060546875, 8.0908203125, 9.12109375, 10.1513671875, 11.181640625, 12.2119140625, 13.2421875, 14.2724609375, 15.302734375, 16.3330078125, 17.36328125, 18.3935546875, 19.423828125, 20.4541015625, 21.484375, 22.5146484375, 23.544921875, 24.5751953125, 25.60546875, 26.6357421875, 27.666015625, 28.6962890625, 29.7265625, 30.7568359375, 31.787109375, 32.8173828125, 33.84765625, 34.8779296875, 35.908203125, 36.9384765625, 37.96875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 6.0, 6.0, 10.0, 17.0, 12.0, 12.0, 15.0, 17.0, 30.0, 34.0, 28.0, 50.0, 52.0, 66.0, 73.0, 71.0, 80.0, 59.0, 43.0, 52.0, 45.0, 46.0, 31.0, 29.0, 19.0, 19.0, 13.0, 17.0, 7.0, 9.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-45.03125, -43.79638671875, -42.5615234375, -41.32666015625, -40.091796875, -38.85693359375, -37.6220703125, -36.38720703125, -35.15234375, -33.91748046875, -32.6826171875, -31.44775390625, -30.212890625, -28.97802734375, -27.7431640625, -26.50830078125, -25.2734375, -24.03857421875, -22.8037109375, -21.56884765625, -20.333984375, -19.09912109375, -17.8642578125, -16.62939453125, -15.39453125, -14.15966796875, -12.9248046875, -11.68994140625, -10.455078125, -9.22021484375, -7.9853515625, -6.75048828125, -5.515625, -4.28076171875, -3.0458984375, -1.81103515625, -0.576171875, 0.65869140625, 1.8935546875, 3.12841796875, 4.36328125, 5.59814453125, 6.8330078125, 8.06787109375, 9.302734375, 10.53759765625, 11.7724609375, 13.00732421875, 14.2421875, 15.47705078125, 16.7119140625, 17.94677734375, 19.181640625, 20.41650390625, 21.6513671875, 22.88623046875, 24.12109375, 25.35595703125, 26.5908203125, 27.82568359375, 29.060546875, 30.29541015625, 31.5302734375, 32.76513671875, 34.0]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 9.0, 14.0, 14.0, 26.0, 27.0, 39.0, 60.0, 68.0, 125.0, 183.0, 334.0, 684.0, 1403.0, 3907.0, 15241.0, 107301.0, 807109.0, 91862.0, 13727.0, 3648.0, 1266.0, 599.0, 319.0, 184.0, 123.0, 68.0, 48.0, 37.0, 24.0, 23.0, 15.0, 13.0, 10.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5, -9.224365234375, -8.94873046875, -8.673095703125, -8.3974609375, -8.121826171875, -7.84619140625, -7.570556640625, -7.294921875, -7.019287109375, -6.74365234375, -6.468017578125, -6.1923828125, -5.916748046875, -5.64111328125, -5.365478515625, -5.08984375, -4.814208984375, -4.53857421875, -4.262939453125, -3.9873046875, -3.711669921875, -3.43603515625, -3.160400390625, -2.884765625, -2.609130859375, -2.33349609375, -2.057861328125, -1.7822265625, -1.506591796875, -1.23095703125, -0.955322265625, -0.6796875, -0.404052734375, -0.12841796875, 0.147216796875, 0.4228515625, 0.698486328125, 0.97412109375, 1.249755859375, 1.525390625, 1.801025390625, 2.07666015625, 2.352294921875, 2.6279296875, 2.903564453125, 3.17919921875, 3.454833984375, 3.73046875, 4.006103515625, 4.28173828125, 4.557373046875, 4.8330078125, 5.108642578125, 5.38427734375, 5.659912109375, 5.935546875, 6.211181640625, 6.48681640625, 6.762451171875, 7.0380859375, 7.313720703125, 7.58935546875, 7.864990234375, 8.140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 4.0, 2.0, 5.0, 6.0, 14.0, 17.0, 20.0, 22.0, 26.0, 42.0, 56.0, 60.0, 83.0, 101.0, 109.0, 74.0, 73.0, 60.0, 42.0, 38.0, 25.0, 24.0, 10.0, 10.0, 14.0, 10.0, 4.0, 9.0, 4.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0021152496337890625, -0.0020510852336883545, -0.0019869208335876465, -0.0019227564334869385, -0.0018585920333862305, -0.0017944276332855225, -0.0017302632331848145, -0.0016660988330841064, -0.0016019344329833984, -0.0015377700328826904, -0.0014736056327819824, -0.0014094412326812744, -0.0013452768325805664, -0.0012811124324798584, -0.0012169480323791504, -0.0011527836322784424, -0.0010886192321777344, -0.0010244548320770264, -0.0009602904319763184, -0.0008961260318756104, -0.0008319616317749023, -0.0007677972316741943, -0.0007036328315734863, -0.0006394684314727783, -0.0005753040313720703, -0.0005111396312713623, -0.0004469752311706543, -0.0003828108310699463, -0.0003186464309692383, -0.0002544820308685303, -0.00019031763076782227, -0.00012615323066711426, -6.198883056640625e-05, 2.175569534301758e-06, 6.633996963500977e-05, 0.00013050436973571777, 0.00019466876983642578, 0.0002588331699371338, 0.0003229975700378418, 0.0003871619701385498, 0.0004513263702392578, 0.0005154907703399658, 0.0005796551704406738, 0.0006438195705413818, 0.0007079839706420898, 0.0007721483707427979, 0.0008363127708435059, 0.0009004771709442139, 0.0009646415710449219, 0.0010288059711456299, 0.0010929703712463379, 0.001157134771347046, 0.001221299171447754, 0.001285463571548462, 0.00134962797164917, 0.001413792371749878, 0.001477956771850586, 0.001542121171951294, 0.001606285572052002, 0.00167044997215271, 0.001734614372253418, 0.001798778772354126, 0.001862943172454834, 0.001927107572555542, 0.00199127197265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 11.0, 10.0, 17.0, 35.0, 46.0, 78.0, 151.0, 252.0, 444.0, 977.0, 2767.0, 12087.0, 108585.0, 827395.0, 81454.0, 9918.0, 2409.0, 899.0, 467.0, 221.0, 118.0, 68.0, 44.0, 37.0, 23.0, 7.0, 8.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.611572265625, -9.33251953125, -9.053466796875, -8.7744140625, -8.495361328125, -8.21630859375, -7.937255859375, -7.658203125, -7.379150390625, -7.10009765625, -6.821044921875, -6.5419921875, -6.262939453125, -5.98388671875, -5.704833984375, -5.42578125, -5.146728515625, -4.86767578125, -4.588623046875, -4.3095703125, -4.030517578125, -3.75146484375, -3.472412109375, -3.193359375, -2.914306640625, -2.63525390625, -2.356201171875, -2.0771484375, -1.798095703125, -1.51904296875, -1.239990234375, -0.9609375, -0.681884765625, -0.40283203125, -0.123779296875, 0.1552734375, 0.434326171875, 0.71337890625, 0.992431640625, 1.271484375, 1.550537109375, 1.82958984375, 2.108642578125, 2.3876953125, 2.666748046875, 2.94580078125, 3.224853515625, 3.50390625, 3.782958984375, 4.06201171875, 4.341064453125, 4.6201171875, 4.899169921875, 5.17822265625, 5.457275390625, 5.736328125, 6.015380859375, 6.29443359375, 6.573486328125, 6.8525390625, 7.131591796875, 7.41064453125, 7.689697265625, 7.96875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 9.0, 20.0, 18.0, 22.0, 23.0, 36.0, 55.0, 70.0, 79.0, 110.0, 141.0, 109.0, 84.0, 54.0, 36.0, 29.0, 29.0, 17.0, 20.0, 10.0, 5.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.078125, -10.80279541015625, -10.5274658203125, -10.25213623046875, -9.976806640625, -9.70147705078125, -9.4261474609375, -9.15081787109375, -8.87548828125, -8.60015869140625, -8.3248291015625, -8.04949951171875, -7.774169921875, -7.49884033203125, -7.2235107421875, -6.94818115234375, -6.6728515625, -6.39752197265625, -6.1221923828125, -5.84686279296875, -5.571533203125, -5.29620361328125, -5.0208740234375, -4.74554443359375, -4.47021484375, -4.19488525390625, -3.9195556640625, -3.64422607421875, -3.368896484375, -3.09356689453125, -2.8182373046875, -2.54290771484375, -2.267578125, -1.99224853515625, -1.7169189453125, -1.44158935546875, -1.166259765625, -0.89093017578125, -0.6156005859375, -0.34027099609375, -0.06494140625, 0.21038818359375, 0.4857177734375, 0.76104736328125, 1.036376953125, 1.31170654296875, 1.5870361328125, 1.86236572265625, 2.1376953125, 2.41302490234375, 2.6883544921875, 2.96368408203125, 3.239013671875, 3.51434326171875, 3.7896728515625, 4.06500244140625, 4.34033203125, 4.61566162109375, 4.8909912109375, 5.16632080078125, 5.441650390625, 5.71697998046875, 5.9923095703125, 6.26763916015625, 6.54296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 5.0, 17.0, 71.0, 303.0, 500.0, 84.0, 17.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-385.83050537109375, -369.12396240234375, -352.4174499511719, -335.7109375, -319.00439453125, -302.2978515625, -285.5913391113281, -268.88482666015625, -252.17828369140625, -235.4717559814453, -218.76522827148438, -202.05870056152344, -185.3521728515625, -168.64564514160156, -151.93911743164062, -135.2325897216797, -118.52606201171875, -101.81953430175781, -85.11300659179688, -68.40647888183594, -51.699951171875, -34.99342346191406, -18.286895751953125, -1.5803680419921875, 15.12615966796875, 31.832687377929688, 48.539215087890625, 65.24574279785156, 81.9522705078125, 98.65879821777344, 115.36532592773438, 132.0718536376953, 148.77838134765625, 165.4849090576172, 182.19143676757812, 198.89796447753906, 215.6044921875, 232.31101989746094, 249.01754760742188, 265.72406005859375, 282.43060302734375, 299.13714599609375, 315.8436584472656, 332.5501708984375, 349.2567138671875, 365.9632568359375, 382.6697692871094, 399.37628173828125, 416.08282470703125, 432.78936767578125, 449.4958801269531, 466.202392578125, 482.908935546875, 499.615478515625, 516.322021484375, 533.0285034179688, 549.7350463867188, 566.4415893554688, 583.1480712890625, 599.8546142578125, 616.5611572265625, 633.2677001953125, 649.9742431640625, 666.6807250976562, 683.3872680664062]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 4.0, 9.0, 12.0, 12.0, 11.0, 14.0, 19.0, 20.0, 32.0, 33.0, 27.0, 21.0, 36.0, 35.0, 82.0, 166.0, 113.0, 42.0, 39.0, 40.0, 29.0, 26.0, 32.0, 27.0, 21.0, 14.0, 14.0, 5.0, 9.0, 3.0, 9.0, 12.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-140.53233337402344, -136.23532104492188, -131.93829345703125, -127.64127349853516, -123.34425354003906, -119.04723358154297, -114.75021362304688, -110.45319366455078, -106.15617370605469, -101.8591537475586, -97.5621337890625, -93.2651138305664, -88.96809387207031, -84.67107391357422, -80.37405395507812, -76.07703399658203, -71.78001403808594, -67.48299407958984, -63.18597412109375, -58.888954162597656, -54.59193420410156, -50.29491424560547, -45.997894287109375, -41.70087432861328, -37.40385437011719, -33.106834411621094, -28.809814453125, -24.512794494628906, -20.215774536132812, -15.918754577636719, -11.621734619140625, -7.324714660644531, -3.027679443359375, 1.2693405151367188, 5.5663604736328125, 9.863380432128906, 14.160400390625, 18.457420349121094, 22.754440307617188, 27.05146026611328, 31.348480224609375, 35.64550018310547, 39.94252014160156, 44.239540100097656, 48.53656005859375, 52.833580017089844, 57.13059997558594, 61.42761993408203, 65.72463989257812, 70.02165985107422, 74.31867980957031, 78.6156997680664, 82.9127197265625, 87.2097396850586, 91.50675964355469, 95.80377960205078, 100.10079956054688, 104.39781951904297, 108.69483947753906, 112.99185943603516, 117.28887939453125, 121.58589935302734, 125.88291931152344, 130.179931640625, 134.47695922851562]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 13.0, 13.0, 32.0, 33.0, 50.0, 123.0, 187.0, 346.0, 760.0, 1730.0, 4158.0, 14388.0, 82375.0, 763144.0, 2526007.0, 704033.0, 76209.0, 13674.0, 3939.0, 1598.0, 674.0, 345.0, 188.0, 106.0, 62.0, 37.0, 18.0, 14.0, 8.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.875, -19.24365234375, -18.6123046875, -17.98095703125, -17.349609375, -16.71826171875, -16.0869140625, -15.45556640625, -14.82421875, -14.19287109375, -13.5615234375, -12.93017578125, -12.298828125, -11.66748046875, -11.0361328125, -10.40478515625, -9.7734375, -9.14208984375, -8.5107421875, -7.87939453125, -7.248046875, -6.61669921875, -5.9853515625, -5.35400390625, -4.72265625, -4.09130859375, -3.4599609375, -2.82861328125, -2.197265625, -1.56591796875, -0.9345703125, -0.30322265625, 0.328125, 0.95947265625, 1.5908203125, 2.22216796875, 2.853515625, 3.48486328125, 4.1162109375, 4.74755859375, 5.37890625, 6.01025390625, 6.6416015625, 7.27294921875, 7.904296875, 8.53564453125, 9.1669921875, 9.79833984375, 10.4296875, 11.06103515625, 11.6923828125, 12.32373046875, 12.955078125, 13.58642578125, 14.2177734375, 14.84912109375, 15.48046875, 16.11181640625, 16.7431640625, 17.37451171875, 18.005859375, 18.63720703125, 19.2685546875, 19.89990234375, 20.53125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 4.0, 6.0, 10.0, 17.0, 17.0, 19.0, 24.0, 27.0, 27.0, 34.0, 34.0, 39.0, 50.0, 52.0, 43.0, 45.0, 48.0, 57.0, 43.0, 48.0, 44.0, 56.0, 40.0, 40.0, 26.0, 32.0, 22.0, 16.0, 20.0, 18.0, 9.0, 9.0, 5.0, 3.0, 6.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.40625, -10.115234375, -9.82421875, -9.533203125, -9.2421875, -8.951171875, -8.66015625, -8.369140625, -8.078125, -7.787109375, -7.49609375, -7.205078125, -6.9140625, -6.623046875, -6.33203125, -6.041015625, -5.75, -5.458984375, -5.16796875, -4.876953125, -4.5859375, -4.294921875, -4.00390625, -3.712890625, -3.421875, -3.130859375, -2.83984375, -2.548828125, -2.2578125, -1.966796875, -1.67578125, -1.384765625, -1.09375, -0.802734375, -0.51171875, -0.220703125, 0.0703125, 0.361328125, 0.65234375, 0.943359375, 1.234375, 1.525390625, 1.81640625, 2.107421875, 2.3984375, 2.689453125, 2.98046875, 3.271484375, 3.5625, 3.853515625, 4.14453125, 4.435546875, 4.7265625, 5.017578125, 5.30859375, 5.599609375, 5.890625, 6.181640625, 6.47265625, 6.763671875, 7.0546875, 7.345703125, 7.63671875, 7.927734375, 8.21875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 8.0, 7.0, 12.0, 11.0, 33.0, 40.0, 64.0, 145.0, 355.0, 797.0, 2102.0, 12498.0, 3333407.0, 833635.0, 8103.0, 1732.0, 679.0, 332.0, 145.0, 76.0, 49.0, 22.0, 9.0, 8.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-82.0, -79.9453125, -77.890625, -75.8359375, -73.78125, -71.7265625, -69.671875, -67.6171875, -65.5625, -63.5078125, -61.453125, -59.3984375, -57.34375, -55.2890625, -53.234375, -51.1796875, -49.125, -47.0703125, -45.015625, -42.9609375, -40.90625, -38.8515625, -36.796875, -34.7421875, -32.6875, -30.6328125, -28.578125, -26.5234375, -24.46875, -22.4140625, -20.359375, -18.3046875, -16.25, -14.1953125, -12.140625, -10.0859375, -8.03125, -5.9765625, -3.921875, -1.8671875, 0.1875, 2.2421875, 4.296875, 6.3515625, 8.40625, 10.4609375, 12.515625, 14.5703125, 16.625, 18.6796875, 20.734375, 22.7890625, 24.84375, 26.8984375, 28.953125, 31.0078125, 33.0625, 35.1171875, 37.171875, 39.2265625, 41.28125, 43.3359375, 45.390625, 47.4453125, 49.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 16.0, 40.0, 39.0, 46.0, 84.0, 110.0, 129.0, 205.0, 292.0, 433.0, 566.0, 595.0, 484.0, 327.0, 232.0, 149.0, 102.0, 66.0, 44.0, 26.0, 19.0, 18.0, 15.0, 11.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.09375, -32.119384765625, -31.14501953125, -30.170654296875, -29.1962890625, -28.221923828125, -27.24755859375, -26.273193359375, -25.298828125, -24.324462890625, -23.35009765625, -22.375732421875, -21.4013671875, -20.427001953125, -19.45263671875, -18.478271484375, -17.50390625, -16.529541015625, -15.55517578125, -14.580810546875, -13.6064453125, -12.632080078125, -11.65771484375, -10.683349609375, -9.708984375, -8.734619140625, -7.76025390625, -6.785888671875, -5.8115234375, -4.837158203125, -3.86279296875, -2.888427734375, -1.9140625, -0.939697265625, 0.03466796875, 1.009033203125, 1.9833984375, 2.957763671875, 3.93212890625, 4.906494140625, 5.880859375, 6.855224609375, 7.82958984375, 8.803955078125, 9.7783203125, 10.752685546875, 11.72705078125, 12.701416015625, 13.67578125, 14.650146484375, 15.62451171875, 16.598876953125, 17.5732421875, 18.547607421875, 19.52197265625, 20.496337890625, 21.470703125, 22.445068359375, 23.41943359375, 24.393798828125, 25.3681640625, 26.342529296875, 27.31689453125, 28.291259765625, 29.265625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 12.0, 20.0, 88.0, 315.0, 378.0, 118.0, 34.0, 24.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-817.62255859375, -796.1454467773438, -774.6682739257812, -753.191162109375, -731.7139892578125, -710.2368774414062, -688.759765625, -667.2825927734375, -645.805419921875, -624.3283081054688, -602.8511352539062, -581.3740234375, -559.8968505859375, -538.4197387695312, -516.942626953125, -495.4654541015625, -473.98834228515625, -452.5111999511719, -431.0340576171875, -409.55694580078125, -388.07977294921875, -366.6026611328125, -345.1255187988281, -323.64837646484375, -302.1712341308594, -280.694091796875, -259.2169494628906, -237.7398223876953, -216.26268005371094, -194.78553771972656, -173.30841064453125, -151.83126831054688, -130.3541259765625, -108.87698364257812, -87.39984893798828, -65.92271423339844, -44.44557189941406, -22.968429565429688, -1.491302490234375, 19.98583984375, 41.462982177734375, 62.940120697021484, 84.4172592163086, 105.89439392089844, 127.37153625488281, 148.8486785888672, 170.3258056640625, 191.80294799804688, 213.28009033203125, 234.75723266601562, 256.234375, 277.71148681640625, 299.18865966796875, 320.665771484375, 342.1429138183594, 363.62005615234375, 385.0971984863281, 406.5743408203125, 428.0514831542969, 449.52862548828125, 471.0057373046875, 492.48291015625, 513.9600219726562, 535.4371337890625, 556.914306640625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 5.0, 8.0, 5.0, 7.0, 8.0, 15.0, 17.0, 20.0, 22.0, 25.0, 24.0, 45.0, 48.0, 32.0, 44.0, 39.0, 51.0, 41.0, 59.0, 54.0, 63.0, 55.0, 50.0, 38.0, 39.0, 30.0, 23.0, 25.0, 24.0, 15.0, 14.0, 9.0, 9.0, 6.0, 8.0, 3.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.72996520996094, -154.490234375, -149.25051879882812, -144.01080322265625, -138.7710723876953, -133.53134155273438, -128.2916259765625, -123.0519027709961, -117.81217956542969, -112.57245635986328, -107.33273315429688, -102.09300994873047, -96.85328674316406, -91.61356353759766, -86.37384033203125, -81.13411712646484, -75.89439392089844, -70.65467071533203, -65.41494750976562, -60.17522430419922, -54.93550109863281, -49.695777893066406, -44.4560546875, -39.216331481933594, -33.97660827636719, -28.73688507080078, -23.497161865234375, -18.25743865966797, -13.017715454101562, -7.777992248535156, -2.53826904296875, 2.7014541625976562, 7.9411773681640625, 13.180900573730469, 18.420623779296875, 23.66034698486328, 28.900070190429688, 34.139793395996094, 39.3795166015625, 44.619239807128906, 49.85896301269531, 55.09868621826172, 60.338409423828125, 65.57813262939453, 70.81785583496094, 76.05757904052734, 81.29730224609375, 86.53702545166016, 91.77674865722656, 97.01647186279297, 102.25619506835938, 107.49591827392578, 112.73564147949219, 117.9753646850586, 123.215087890625, 128.45480346679688, 133.6945343017578, 138.93426513671875, 144.17398071289062, 149.4136962890625, 154.65342712402344, 159.89315795898438, 165.13287353515625, 170.37258911132812, 175.61231994628906]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 9.0, 6.0, 7.0, 9.0, 12.0, 15.0, 24.0, 35.0, 51.0, 71.0, 90.0, 166.0, 244.0, 413.0, 628.0, 1056.0, 1879.0, 3389.0, 6626.0, 13750.0, 31579.0, 86384.0, 317910.0, 411106.0, 104055.0, 37056.0, 15631.0, 7331.0, 3801.0, 2149.0, 1171.0, 717.0, 399.0, 254.0, 177.0, 115.0, 64.0, 56.0, 19.0, 26.0, 26.0, 9.0, 7.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.375, -12.9447021484375, -12.514404296875, -12.0841064453125, -11.65380859375, -11.2235107421875, -10.793212890625, -10.3629150390625, -9.9326171875, -9.5023193359375, -9.072021484375, -8.6417236328125, -8.21142578125, -7.7811279296875, -7.350830078125, -6.9205322265625, -6.490234375, -6.0599365234375, -5.629638671875, -5.1993408203125, -4.76904296875, -4.3387451171875, -3.908447265625, -3.4781494140625, -3.0478515625, -2.6175537109375, -2.187255859375, -1.7569580078125, -1.32666015625, -0.8963623046875, -0.466064453125, -0.0357666015625, 0.39453125, 0.8248291015625, 1.255126953125, 1.6854248046875, 2.11572265625, 2.5460205078125, 2.976318359375, 3.4066162109375, 3.8369140625, 4.2672119140625, 4.697509765625, 5.1278076171875, 5.55810546875, 5.9884033203125, 6.418701171875, 6.8489990234375, 7.279296875, 7.7095947265625, 8.139892578125, 8.5701904296875, 9.00048828125, 9.4307861328125, 9.861083984375, 10.2913818359375, 10.7216796875, 11.1519775390625, 11.582275390625, 12.0125732421875, 12.44287109375, 12.8731689453125, 13.303466796875, 13.7337646484375, 14.1640625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 9.0, 12.0, 17.0, 25.0, 31.0, 33.0, 23.0, 43.0, 41.0, 62.0, 61.0, 71.0, 60.0, 77.0, 69.0, 53.0, 51.0, 67.0, 46.0, 31.0, 27.0, 18.0, 18.0, 18.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.8905029296875, -11.445068359375, -10.9996337890625, -10.55419921875, -10.1087646484375, -9.663330078125, -9.2178955078125, -8.7724609375, -8.3270263671875, -7.881591796875, -7.4361572265625, -6.99072265625, -6.5452880859375, -6.099853515625, -5.6544189453125, -5.208984375, -4.7635498046875, -4.318115234375, -3.8726806640625, -3.42724609375, -2.9818115234375, -2.536376953125, -2.0909423828125, -1.6455078125, -1.2000732421875, -0.754638671875, -0.3092041015625, 0.13623046875, 0.5816650390625, 1.027099609375, 1.4725341796875, 1.91796875, 2.3634033203125, 2.808837890625, 3.2542724609375, 3.69970703125, 4.1451416015625, 4.590576171875, 5.0360107421875, 5.4814453125, 5.9268798828125, 6.372314453125, 6.8177490234375, 7.26318359375, 7.7086181640625, 8.154052734375, 8.5994873046875, 9.044921875, 9.4903564453125, 9.935791015625, 10.3812255859375, 10.82666015625, 11.2720947265625, 11.717529296875, 12.1629638671875, 12.6083984375, 13.0538330078125, 13.499267578125, 13.9447021484375, 14.39013671875, 14.8355712890625, 15.281005859375, 15.7264404296875, 16.171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 8.0, 7.0, 7.0, 13.0, 14.0, 20.0, 39.0, 39.0, 55.0, 106.0, 176.0, 283.0, 556.0, 1393.0, 4660.0, 32955.0, 910659.0, 85659.0, 8318.0, 1936.0, 729.0, 347.0, 213.0, 122.0, 71.0, 56.0, 25.0, 25.0, 16.0, 10.0, 17.0, 4.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.0, -25.025390625, -24.05078125, -23.076171875, -22.1015625, -21.126953125, -20.15234375, -19.177734375, -18.203125, -17.228515625, -16.25390625, -15.279296875, -14.3046875, -13.330078125, -12.35546875, -11.380859375, -10.40625, -9.431640625, -8.45703125, -7.482421875, -6.5078125, -5.533203125, -4.55859375, -3.583984375, -2.609375, -1.634765625, -0.66015625, 0.314453125, 1.2890625, 2.263671875, 3.23828125, 4.212890625, 5.1875, 6.162109375, 7.13671875, 8.111328125, 9.0859375, 10.060546875, 11.03515625, 12.009765625, 12.984375, 13.958984375, 14.93359375, 15.908203125, 16.8828125, 17.857421875, 18.83203125, 19.806640625, 20.78125, 21.755859375, 22.73046875, 23.705078125, 24.6796875, 25.654296875, 26.62890625, 27.603515625, 28.578125, 29.552734375, 30.52734375, 31.501953125, 32.4765625, 33.451171875, 34.42578125, 35.400390625, 36.375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 8.0, 9.0, 7.0, 12.0, 16.0, 20.0, 24.0, 24.0, 32.0, 23.0, 35.0, 48.0, 76.0, 81.0, 82.0, 84.0, 74.0, 68.0, 34.0, 42.0, 38.0, 28.0, 22.0, 19.0, 25.0, 14.0, 11.0, 9.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-51.03125, -49.6181640625, -48.205078125, -46.7919921875, -45.37890625, -43.9658203125, -42.552734375, -41.1396484375, -39.7265625, -38.3134765625, -36.900390625, -35.4873046875, -34.07421875, -32.6611328125, -31.248046875, -29.8349609375, -28.421875, -27.0087890625, -25.595703125, -24.1826171875, -22.76953125, -21.3564453125, -19.943359375, -18.5302734375, -17.1171875, -15.7041015625, -14.291015625, -12.8779296875, -11.46484375, -10.0517578125, -8.638671875, -7.2255859375, -5.8125, -4.3994140625, -2.986328125, -1.5732421875, -0.16015625, 1.2529296875, 2.666015625, 4.0791015625, 5.4921875, 6.9052734375, 8.318359375, 9.7314453125, 11.14453125, 12.5576171875, 13.970703125, 15.3837890625, 16.796875, 18.2099609375, 19.623046875, 21.0361328125, 22.44921875, 23.8623046875, 25.275390625, 26.6884765625, 28.1015625, 29.5146484375, 30.927734375, 32.3408203125, 33.75390625, 35.1669921875, 36.580078125, 37.9931640625, 39.40625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 3.0, 6.0, 7.0, 6.0, 8.0, 6.0, 26.0, 35.0, 51.0, 89.0, 165.0, 303.0, 931.0, 3521.0, 25800.0, 946158.0, 63059.0, 6097.0, 1344.0, 455.0, 192.0, 106.0, 69.0, 33.0, 36.0, 11.0, 8.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.2890625, -8.0186767578125, -7.748291015625, -7.4779052734375, -7.20751953125, -6.9371337890625, -6.666748046875, -6.3963623046875, -6.1259765625, -5.8555908203125, -5.585205078125, -5.3148193359375, -5.04443359375, -4.7740478515625, -4.503662109375, -4.2332763671875, -3.962890625, -3.6925048828125, -3.422119140625, -3.1517333984375, -2.88134765625, -2.6109619140625, -2.340576171875, -2.0701904296875, -1.7998046875, -1.5294189453125, -1.259033203125, -0.9886474609375, -0.71826171875, -0.4478759765625, -0.177490234375, 0.0928955078125, 0.36328125, 0.6336669921875, 0.904052734375, 1.1744384765625, 1.44482421875, 1.7152099609375, 1.985595703125, 2.2559814453125, 2.5263671875, 2.7967529296875, 3.067138671875, 3.3375244140625, 3.60791015625, 3.8782958984375, 4.148681640625, 4.4190673828125, 4.689453125, 4.9598388671875, 5.230224609375, 5.5006103515625, 5.77099609375, 6.0413818359375, 6.311767578125, 6.5821533203125, 6.8525390625, 7.1229248046875, 7.393310546875, 7.6636962890625, 7.93408203125, 8.2044677734375, 8.474853515625, 8.7452392578125, 9.015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 10.0, 8.0, 8.0, 15.0, 7.0, 15.0, 19.0, 27.0, 33.0, 51.0, 72.0, 87.0, 112.0, 105.0, 109.0, 73.0, 65.0, 37.0, 34.0, 27.0, 16.0, 15.0, 12.0, 8.0, 8.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0015878677368164062, -0.0015385299921035767, -0.001489192247390747, -0.0014398545026779175, -0.0013905167579650879, -0.0013411790132522583, -0.0012918412685394287, -0.0012425035238265991, -0.0011931657791137695, -0.00114382803440094, -0.0010944902896881104, -0.0010451525449752808, -0.0009958148002624512, -0.0009464770555496216, -0.000897139310836792, -0.0008478015661239624, -0.0007984638214111328, -0.0007491260766983032, -0.0006997883319854736, -0.000650450587272644, -0.0006011128425598145, -0.0005517750978469849, -0.0005024373531341553, -0.0004530996084213257, -0.0004037618637084961, -0.0003544241189956665, -0.0003050863742828369, -0.0002557486295700073, -0.00020641088485717773, -0.00015707314014434814, -0.00010773539543151855, -5.8397650718688965e-05, -9.059906005859375e-06, 4.0277838706970215e-05, 8.96155834197998e-05, 0.0001389533281326294, 0.00018829107284545898, 0.00023762881755828857, 0.00028696656227111816, 0.00033630430698394775, 0.00038564205169677734, 0.00043497979640960693, 0.0004843175411224365, 0.0005336552858352661, 0.0005829930305480957, 0.0006323307752609253, 0.0006816685199737549, 0.0007310062646865845, 0.0007803440093994141, 0.0008296817541122437, 0.0008790194988250732, 0.0009283572435379028, 0.0009776949882507324, 0.001027032732963562, 0.0010763704776763916, 0.0011257082223892212, 0.0011750459671020508, 0.0012243837118148804, 0.00127372145652771, 0.0013230592012405396, 0.0013723969459533691, 0.0014217346906661987, 0.0014710724353790283, 0.001520410180091858, 0.0015697479248046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 11.0, 15.0, 13.0, 31.0, 46.0, 73.0, 101.0, 186.0, 406.0, 953.0, 2794.0, 12019.0, 126426.0, 871305.0, 26782.0, 4734.0, 1461.0, 566.0, 264.0, 141.0, 80.0, 36.0, 34.0, 26.0, 8.0, 9.0, 7.0, 4.0, 2.0, 3.0, 5.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.91015625, -6.72442626953125, -6.5386962890625, -6.35296630859375, -6.167236328125, -5.98150634765625, -5.7957763671875, -5.61004638671875, -5.42431640625, -5.23858642578125, -5.0528564453125, -4.86712646484375, -4.681396484375, -4.49566650390625, -4.3099365234375, -4.12420654296875, -3.9384765625, -3.75274658203125, -3.5670166015625, -3.38128662109375, -3.195556640625, -3.00982666015625, -2.8240966796875, -2.63836669921875, -2.45263671875, -2.26690673828125, -2.0811767578125, -1.89544677734375, -1.709716796875, -1.52398681640625, -1.3382568359375, -1.15252685546875, -0.966796875, -0.78106689453125, -0.5953369140625, -0.40960693359375, -0.223876953125, -0.03814697265625, 0.1475830078125, 0.33331298828125, 0.51904296875, 0.70477294921875, 0.8905029296875, 1.07623291015625, 1.261962890625, 1.44769287109375, 1.6334228515625, 1.81915283203125, 2.0048828125, 2.19061279296875, 2.3763427734375, 2.56207275390625, 2.747802734375, 2.93353271484375, 3.1192626953125, 3.30499267578125, 3.49072265625, 3.67645263671875, 3.8621826171875, 4.04791259765625, 4.233642578125, 4.41937255859375, 4.6051025390625, 4.79083251953125, 4.9765625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 10.0, 8.0, 17.0, 25.0, 20.0, 44.0, 57.0, 93.0, 133.0, 178.0, 123.0, 123.0, 43.0, 37.0, 29.0, 28.0, 12.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.62890625, -6.4039306640625, -6.178955078125, -5.9539794921875, -5.72900390625, -5.5040283203125, -5.279052734375, -5.0540771484375, -4.8291015625, -4.6041259765625, -4.379150390625, -4.1541748046875, -3.92919921875, -3.7042236328125, -3.479248046875, -3.2542724609375, -3.029296875, -2.8043212890625, -2.579345703125, -2.3543701171875, -2.12939453125, -1.9044189453125, -1.679443359375, -1.4544677734375, -1.2294921875, -1.0045166015625, -0.779541015625, -0.5545654296875, -0.32958984375, -0.1046142578125, 0.120361328125, 0.3453369140625, 0.5703125, 0.7952880859375, 1.020263671875, 1.2452392578125, 1.47021484375, 1.6951904296875, 1.920166015625, 2.1451416015625, 2.3701171875, 2.5950927734375, 2.820068359375, 3.0450439453125, 3.27001953125, 3.4949951171875, 3.719970703125, 3.9449462890625, 4.169921875, 4.3948974609375, 4.619873046875, 4.8448486328125, 5.06982421875, 5.2947998046875, 5.519775390625, 5.7447509765625, 5.9697265625, 6.1947021484375, 6.419677734375, 6.6446533203125, 6.86962890625, 7.0946044921875, 7.319580078125, 7.5445556640625, 7.76953125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 13.0, 23.0, 45.0, 105.0, 561.0, 143.0, 54.0, 26.0, 13.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.2810821533203, -198.8896942138672, -190.49830627441406, -182.10691833496094, -173.7155303955078, -165.3241424560547, -156.93276977539062, -148.5413818359375, -140.14999389648438, -131.75860595703125, -123.36721801757812, -114.975830078125, -106.58444213867188, -98.19305419921875, -89.80167388916016, -81.41028594970703, -73.01889038085938, -64.62750244140625, -56.236114501953125, -47.844730377197266, -39.45334243774414, -31.061954498291016, -22.670570373535156, -14.279182434082031, -5.887794494628906, 2.5035924911499023, 10.894979476928711, 19.286365509033203, 27.677753448486328, 36.06914138793945, 44.46052551269531, 52.85191345214844, 61.243316650390625, 69.63470458984375, 78.02609252929688, 86.41748046875, 94.80886840820312, 103.20025634765625, 111.59163665771484, 119.98302459716797, 128.37442016601562, 136.76580810546875, 145.15719604492188, 153.548583984375, 161.93997192382812, 170.33135986328125, 178.72274780273438, 187.1141357421875, 195.50550842285156, 203.8968963623047, 212.2882843017578, 220.67967224121094, 229.07106018066406, 237.4624481201172, 245.85382080078125, 254.24520874023438, 262.6365966796875, 271.0279846191406, 279.41937255859375, 287.8107604980469, 296.2021484375, 304.5935363769531, 312.98492431640625, 321.3763122558594, 329.7677001953125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 6.0, 14.0, 17.0, 16.0, 16.0, 19.0, 15.0, 16.0, 26.0, 25.0, 19.0, 29.0, 44.0, 132.0, 274.0, 90.0, 34.0, 25.0, 26.0, 16.0, 18.0, 21.0, 19.0, 8.0, 8.0, 11.0, 8.0, 7.0, 9.0, 6.0, 2.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-124.81257629394531, -121.07792663574219, -117.34327697753906, -113.60862731933594, -109.87397766113281, -106.13932800292969, -102.40467834472656, -98.67002868652344, -94.93537902832031, -91.20072937011719, -87.46607971191406, -83.73143005371094, -79.99678039550781, -76.26213073730469, -72.52748107910156, -68.79283142089844, -65.05817413330078, -61.323524475097656, -57.58887481689453, -53.854225158691406, -50.11957550048828, -46.384925842285156, -42.650272369384766, -38.91562271118164, -35.180973052978516, -31.44632339477539, -27.711673736572266, -23.977022171020508, -20.242372512817383, -16.507722854614258, -12.7730712890625, -9.038421630859375, -5.303779602050781, -1.569129467010498, 2.165520668029785, 5.900171279907227, 9.634820938110352, 13.369470596313477, 17.104122161865234, 20.83877182006836, 24.573421478271484, 28.30807113647461, 32.042720794677734, 35.777374267578125, 39.51202392578125, 43.246673583984375, 46.9813232421875, 50.715972900390625, 54.45062255859375, 58.185272216796875, 61.919921875, 65.65457153320312, 69.38922119140625, 73.12387084960938, 76.8585205078125, 80.59317016601562, 84.32781982421875, 88.06246948242188, 91.797119140625, 95.53176879882812, 99.26641845703125, 103.00106811523438, 106.7357177734375, 110.47036743164062, 114.20502471923828]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 9.0, 7.0, 12.0, 12.0, 20.0, 23.0, 19.0, 27.0, 32.0, 24.0, 42.0, 58.0, 112.0, 256.0, 75.0, 50.0, 23.0, 41.0, 24.0, 26.0, 17.0, 12.0, 18.0, 8.0, 12.0, 10.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.1683349609375, -11.813232421875, -11.4581298828125, -11.10302734375, -10.7479248046875, -10.392822265625, -10.0377197265625, -9.6826171875, -9.3275146484375, -8.972412109375, -8.6173095703125, -8.26220703125, -7.9071044921875, -7.552001953125, -7.1968994140625, -6.841796875, -6.4866943359375, -6.131591796875, -5.7764892578125, -5.42138671875, -5.0662841796875, -4.711181640625, -4.3560791015625, -4.0009765625, -3.6458740234375, -3.290771484375, -2.9356689453125, -2.58056640625, -2.2254638671875, -1.870361328125, -1.5152587890625, -1.16015625, -0.8050537109375, -0.449951171875, -0.0948486328125, 0.26025390625, 0.6153564453125, 0.970458984375, 1.3255615234375, 1.6806640625, 2.0357666015625, 2.390869140625, 2.7459716796875, 3.10107421875, 3.4561767578125, 3.811279296875, 4.1663818359375, 4.521484375, 4.8765869140625, 5.231689453125, 5.5867919921875, 5.94189453125, 6.2969970703125, 6.652099609375, 7.0072021484375, 7.3623046875, 7.7174072265625, 8.072509765625, 8.4276123046875, 8.78271484375, 9.1378173828125, 9.492919921875, 9.8480224609375, 10.203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 4.0, 12.0, 15.0, 29.0, 25.0, 56.0, 59.0, 148.0, 431.0, 2881.0, 8321010.0, 61463.0, 1824.0, 317.0, 97.0, 65.0, 42.0, 27.0, 11.0, 12.0, 4.0, 1.0, 7.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0], "bins": [-170.0876922607422, -163.993408203125, -157.8991241455078, -151.80484008789062, -145.7105712890625, -139.6162872314453, -133.52200317382812, -127.42771911621094, -121.33344268798828, -115.2391586303711, -109.14488220214844, -103.05059814453125, -96.95631408691406, -90.8620376586914, -84.76775360107422, -78.67347717285156, -72.57919311523438, -66.48490905761719, -60.39063262939453, -54.296348571777344, -48.20206832885742, -42.1077880859375, -36.01350402832031, -29.91922378540039, -23.82494354248047, -17.730663299560547, -11.636381149291992, -5.5420989990234375, 0.5521812438964844, 6.646461486816406, 12.740745544433594, 18.835025787353516, 24.929290771484375, 31.023571014404297, 37.11785125732422, 43.212135314941406, 49.30641555786133, 55.40069580078125, 61.49497985839844, 67.58926391601562, 73.68354034423828, 79.77782440185547, 85.87210083007812, 91.96638488769531, 98.0606689453125, 104.15494537353516, 110.24922943115234, 116.343505859375, 122.43778991699219, 128.53207397460938, 134.62635803222656, 140.72064208984375, 146.81491088867188, 152.90919494628906, 159.00347900390625, 165.09776306152344, 171.19204711914062, 177.2863311767578, 183.380615234375, 189.47488403320312, 195.5691680908203, 201.6634521484375, 207.7577362060547, 213.85202026367188, 219.9462890625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-139.7555389404297, -135.02426147460938, -130.29296875, -125.56168365478516, -120.83039855957031, -116.09912109375, -111.36783599853516, -106.63655090332031, -101.90526580810547, -97.17398071289062, -92.44269561767578, -87.71141052246094, -82.98013305664062, -78.24884033203125, -73.51756286621094, -68.7862777709961, -64.05499267578125, -59.323707580566406, -54.59242248535156, -49.861141204833984, -45.12985610961914, -40.3985710144043, -35.66728973388672, -30.936004638671875, -26.20471954345703, -21.473434448242188, -16.742151260375977, -12.01086711883545, -7.279582977294922, -2.548297882080078, 2.182985305786133, 6.914268493652344, 11.64556884765625, 16.376853942871094, 21.108137130737305, 25.839420318603516, 30.57070541381836, 35.3019905090332, 40.03327178955078, 44.764556884765625, 49.49584197998047, 54.22712707519531, 58.958412170410156, 63.689693450927734, 68.42097473144531, 73.15226745605469, 77.883544921875, 82.61483001708984, 87.34611511230469, 92.07740020751953, 96.80868530273438, 101.53997039794922, 106.27125549316406, 111.00253295898438, 115.73381805419922, 120.46510314941406, 125.1963882446289, 129.92767333984375, 134.65895080566406, 139.39024353027344, 144.12152099609375, 148.85281372070312, 153.58409118652344, 158.31536865234375, 163.04666137695312]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 11.0, 7.0, 4.0, 15.0, 15.0, 21.0, 25.0, 43.0, 45.0, 56.0, 71.0, 124.0, 145.0, 208.0, 324.0, 563.0, 1147.0, 2484.0, 5763.0, 14821.0, 38991.0, 101966.0, 184930.0, 105749.0, 40292.0, 15179.0, 6045.0, 2517.0, 1136.0, 586.0, 323.0, 190.0, 119.0, 92.0, 73.0, 35.0, 40.0, 29.0, 17.0, 19.0, 14.0, 12.0, 10.0, 0.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.4375, -58.318359375, -56.19921875, -54.080078125, -51.9609375, -49.841796875, -47.72265625, -45.603515625, -43.484375, -41.365234375, -39.24609375, -37.126953125, -35.0078125, -32.888671875, -30.76953125, -28.650390625, -26.53125, -24.412109375, -22.29296875, -20.173828125, -18.0546875, -15.935546875, -13.81640625, -11.697265625, -9.578125, -7.458984375, -5.33984375, -3.220703125, -1.1015625, 1.017578125, 3.13671875, 5.255859375, 7.375, 9.494140625, 11.61328125, 13.732421875, 15.8515625, 17.970703125, 20.08984375, 22.208984375, 24.328125, 26.447265625, 28.56640625, 30.685546875, 32.8046875, 34.923828125, 37.04296875, 39.162109375, 41.28125, 43.400390625, 45.51953125, 47.638671875, 49.7578125, 51.876953125, 53.99609375, 56.115234375, 58.234375, 60.353515625, 62.47265625, 64.591796875, 66.7109375, 68.830078125, 70.94921875, 73.068359375, 75.1875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 8.0, 11.0, 12.0, 18.0, 21.0, 29.0, 32.0, 38.0, 45.0, 70.0, 74.0, 90.0, 78.0, 78.0, 75.0, 62.0, 59.0, 36.0, 48.0, 21.0, 24.0, 25.0, 9.0, 11.0, 6.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.171875, -12.7274169921875, -12.282958984375, -11.8385009765625, -11.39404296875, -10.9495849609375, -10.505126953125, -10.0606689453125, -9.6162109375, -9.1717529296875, -8.727294921875, -8.2828369140625, -7.83837890625, -7.3939208984375, -6.949462890625, -6.5050048828125, -6.060546875, -5.6160888671875, -5.171630859375, -4.7271728515625, -4.28271484375, -3.8382568359375, -3.393798828125, -2.9493408203125, -2.5048828125, -2.0604248046875, -1.615966796875, -1.1715087890625, -0.72705078125, -0.2825927734375, 0.161865234375, 0.6063232421875, 1.05078125, 1.4952392578125, 1.939697265625, 2.3841552734375, 2.82861328125, 3.2730712890625, 3.717529296875, 4.1619873046875, 4.6064453125, 5.0509033203125, 5.495361328125, 5.9398193359375, 6.38427734375, 6.8287353515625, 7.273193359375, 7.7176513671875, 8.162109375, 8.6065673828125, 9.051025390625, 9.4954833984375, 9.93994140625, 10.3843994140625, 10.828857421875, 11.2733154296875, 11.7177734375, 12.1622314453125, 12.606689453125, 13.0511474609375, 13.49560546875, 13.9400634765625, 14.384521484375, 14.8289794921875, 15.2734375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 10.0, 25.0, 66.0, 125.0, 140.0, 76.0, 22.0, 6.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.9715690612793, -59.34646987915039, -54.72137451171875, -50.096275329589844, -45.47117614746094, -40.8460807800293, -36.22098159790039, -31.59588623046875, -26.970787048339844, -22.34568977355957, -17.720592498779297, -13.09549331665039, -8.470396041870117, -3.8452987670898438, 0.7798004150390625, 5.404895782470703, 10.02999496459961, 14.655092239379883, 19.280189514160156, 23.905288696289062, 28.530385971069336, 33.15548324584961, 37.780582427978516, 42.405677795410156, 47.03077697753906, 51.65587615966797, 56.28097152709961, 60.906070709228516, 65.53116607666016, 70.15626525878906, 74.78136444091797, 79.40646362304688, 84.03155517578125, 88.65665435791016, 93.28175354003906, 97.90684509277344, 102.53194427490234, 107.15704345703125, 111.78214263916016, 116.40724182128906, 121.03233337402344, 125.65743255615234, 130.28253173828125, 134.90762329101562, 139.53273010253906, 144.15782165527344, 148.78292846679688, 153.40802001953125, 158.03311157226562, 162.658203125, 167.28330993652344, 171.9084014892578, 176.53350830078125, 181.15859985351562, 185.78369140625, 190.40879821777344, 195.03390502929688, 199.65899658203125, 204.2841033935547, 208.90919494628906, 213.5343017578125, 218.15939331054688, 222.78448486328125, 227.4095916748047, 232.03468322753906]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 12.0, 5.0, 11.0, 12.0, 20.0, 85.0, 146.0, 115.0, 41.0, 10.0, 13.0, 7.0, 7.0, 0.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.4468994140625, -97.94044494628906, -94.43399047851562, -90.92753601074219, -87.42108154296875, -83.91462707519531, -80.40817260742188, -76.90172576904297, -73.39527130126953, -69.8888168334961, -66.38236236572266, -62.87590789794922, -59.36945724487305, -55.86300277709961, -52.35654830932617, -48.85009765625, -45.3436393737793, -41.83718490600586, -38.33073043823242, -34.82427978515625, -31.317825317382812, -27.811370849609375, -24.304916381835938, -20.798463821411133, -17.292009353637695, -13.785555839538574, -10.279102325439453, -6.772647857666016, -3.2661943435668945, 0.24025917053222656, 3.746713638305664, 7.253166198730469, 10.759620666503906, 14.266074180603027, 17.77252769470215, 21.278982162475586, 24.78543472290039, 28.291889190673828, 31.798343658447266, 35.30479431152344, 38.811248779296875, 42.31770324707031, 45.82415771484375, 49.33061218261719, 52.83706283569336, 56.3435173034668, 59.849971771240234, 63.356422424316406, 66.86288452148438, 70.36933898925781, 73.87579345703125, 77.38224792480469, 80.88870239257812, 84.39515686035156, 87.901611328125, 91.4080581665039, 94.91451263427734, 98.42096710205078, 101.92742156982422, 105.43387603759766, 108.9403305053711, 112.44677734375, 115.95323181152344, 119.45968627929688, 122.96614074707031]}, "eval/loss": 6.791457653045654, "eval/wer": 1.820663928408437, "eval/runtime": 1551.0153, "eval/samples_per_second": 1.703, "eval/steps_per_second": 0.426} \ No newline at end of file +{"train/loss": 6.613, "train/learning_rate": 2.5588667777668858e-05, "train/epoch": 0.56, "train/global_step": 2000, "_runtime": 8783, "_timestamp": 1646223062, "_step": 2003, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30304.0, 150.0, 25.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4046.0, -3966.328125, -3886.65625, -3806.984375, -3727.3125, -3647.640625, -3567.96875, -3488.296875, -3408.625, -3328.953125, -3249.28125, -3169.609375, -3089.9375, -3010.265625, -2930.59375, -2850.921875, -2771.25, -2691.578125, -2611.90625, -2532.234375, -2452.5625, -2372.890625, -2293.21875, -2213.546875, -2133.875, -2054.203125, -1974.53125, -1894.859375, -1815.1875, -1735.515625, -1655.84375, -1576.171875, -1496.5, -1416.828125, -1337.15625, -1257.484375, -1177.8125, -1098.140625, -1018.46875, -938.796875, -859.125, -779.453125, -699.78125, -620.109375, -540.4375, -460.765625, -381.09375, -301.421875, -221.75, -142.078125, -62.40625, 17.265625, 96.9375, 176.609375, 256.28125, 335.953125, 415.625, 495.296875, 574.96875, 654.640625, 734.3125, 813.984375, 893.65625, 973.328125, 1053.0]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 12.0, 13.0, 16.0, 32.0, 30.0, 39.0, 50.0, 62.0, 87.0, 84.0, 96.0, 96.0, 66.0, 79.0, 56.0, 46.0, 27.0, 22.0, 25.0, 12.0, 7.0, 11.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-644.0227661132812, -622.0311889648438, -600.0396728515625, -578.048095703125, -556.0565795898438, -534.0650024414062, -512.073486328125, -490.0819091796875, -468.0903625488281, -446.09881591796875, -424.1072692871094, -402.11572265625, -380.1241455078125, -358.13262939453125, -336.14105224609375, -314.1495056152344, -292.157958984375, -270.1664123535156, -248.17486572265625, -226.1833038330078, -204.19175720214844, -182.20021057128906, -160.20864868164062, -138.21710205078125, -116.22555541992188, -94.2340087890625, -72.2424545288086, -50.25090026855469, -28.259353637695312, -6.2678070068359375, 15.7237548828125, 37.715301513671875, 59.706787109375, 81.69833374023438, 103.68988800048828, 125.68144226074219, 147.67298889160156, 169.66453552246094, 191.65609741210938, 213.64764404296875, 235.63919067382812, 257.6307373046875, 279.6222839355469, 301.61383056640625, 323.60540771484375, 345.596923828125, 367.5885009765625, 389.5800476074219, 411.57159423828125, 433.5631408691406, 455.5546875, 477.5462646484375, 499.53778076171875, 521.5293579101562, 543.5208740234375, 565.512451171875, 587.5040283203125, 609.49560546875, 631.4871215820312, 653.4786987304688, 675.47021484375, 697.4617919921875, 719.453369140625, 741.4448852539062, 763.4364013671875]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 1.0, 5.0, 2.0, 4.0, 5.0, 4.0, 13.0, 14.0, 20.0, 14.0, 10.0, 20.0, 14.0, 28.0, 25.0, 24.0, 31.0, 31.0, 32.0, 28.0, 26.0, 38.0, 41.0, 40.0, 38.0, 29.0, 54.0, 44.0, 34.0, 37.0, 37.0, 39.0, 21.0, 25.0, 19.0, 15.0, 12.0, 25.0, 13.0, 14.0, 10.0, 15.0, 11.0, 8.0, 6.0, 2.0, 7.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-418.6318359375, -406.0548400878906, -393.47784423828125, -380.9008483886719, -368.3238525390625, -355.7468566894531, -343.16986083984375, -330.5928649902344, -318.015869140625, -305.4388732910156, -292.86187744140625, -280.2848815917969, -267.7078857421875, -255.13088989257812, -242.55389404296875, -229.97689819335938, -217.39990234375, -204.82290649414062, -192.24591064453125, -179.66891479492188, -167.0919189453125, -154.51492309570312, -141.93792724609375, -129.36093139648438, -116.783935546875, -104.20693969726562, -91.62994384765625, -79.05294799804688, -66.4759521484375, -53.898956298828125, -41.32196044921875, -28.744964599609375, -16.16796875, -3.590972900390625, 8.98602294921875, 21.563018798828125, 34.1400146484375, 46.717010498046875, 59.29400634765625, 71.87100219726562, 84.447998046875, 97.02499389648438, 109.60198974609375, 122.17898559570312, 134.7559814453125, 147.33297729492188, 159.90997314453125, 172.48696899414062, 185.06396484375, 197.64096069335938, 210.21795654296875, 222.79495239257812, 235.3719482421875, 247.94894409179688, 260.52593994140625, 273.1029357910156, 285.679931640625, 298.2569274902344, 310.83392333984375, 323.4109191894531, 335.9879150390625, 348.5649108886719, 361.14190673828125, 373.7189025878906, 386.2958984375]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 9.0, 10.0, 18.0, 18.0, 20.0, 34.0, 49.0, 72.0, 88.0, 143.0, 175.0, 251.0, 387.0, 563.0, 835.0, 1302.0, 1927.0, 3116.0, 4883.0, 7751.0, 12784.0, 21245.0, 36686.0, 68373.0, 168833.0, 444698.0, 131770.0, 59792.0, 32653.0, 18911.0, 11476.0, 7116.0, 4501.0, 2685.0, 1761.0, 1167.0, 767.0, 523.0, 359.0, 254.0, 137.0, 125.0, 88.0, 58.0, 54.0, 27.0, 23.0, 14.0, 9.0, 4.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1196.0, -1155.3125, -1114.625, -1073.9375, -1033.25, -992.5625, -951.875, -911.1875, -870.5, -829.8125, -789.125, -748.4375, -707.75, -667.0625, -626.375, -585.6875, -545.0, -504.3125, -463.625, -422.9375, -382.25, -341.5625, -300.875, -260.1875, -219.5, -178.8125, -138.125, -97.4375, -56.75, -16.0625, 24.625, 65.3125, 106.0, 146.6875, 187.375, 228.0625, 268.75, 309.4375, 350.125, 390.8125, 431.5, 472.1875, 512.875, 553.5625, 594.25, 634.9375, 675.625, 716.3125, 757.0, 797.6875, 838.375, 879.0625, 919.75, 960.4375, 1001.125, 1041.8125, 1082.5, 1123.1875, 1163.875, 1204.5625, 1245.25, 1285.9375, 1326.625, 1367.3125, 1408.0]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 2.0, 6.0, 7.0, 5.0, 14.0, 9.0, 10.0, 7.0, 14.0, 14.0, 17.0, 22.0, 28.0, 35.0, 45.0, 73.0, 107.0, 148.0, 100.0, 74.0, 41.0, 39.0, 18.0, 22.0, 17.0, 16.0, 19.0, 12.0, 16.0, 11.0, 4.0, 6.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-362.5, -350.23046875, -337.9609375, -325.69140625, -313.421875, -301.15234375, -288.8828125, -276.61328125, -264.34375, -252.07421875, -239.8046875, -227.53515625, -215.265625, -202.99609375, -190.7265625, -178.45703125, -166.1875, -153.91796875, -141.6484375, -129.37890625, -117.109375, -104.83984375, -92.5703125, -80.30078125, -68.03125, -55.76171875, -43.4921875, -31.22265625, -18.953125, -6.68359375, 5.5859375, 17.85546875, 30.125, 42.39453125, 54.6640625, 66.93359375, 79.203125, 91.47265625, 103.7421875, 116.01171875, 128.28125, 140.55078125, 152.8203125, 165.08984375, 177.359375, 189.62890625, 201.8984375, 214.16796875, 226.4375, 238.70703125, 250.9765625, 263.24609375, 275.515625, 287.78515625, 300.0546875, 312.32421875, 324.59375, 336.86328125, 349.1328125, 361.40234375, 373.671875, 385.94140625, 398.2109375, 410.48046875, 422.75]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 7.0, 7.0, 7.0, 11.0, 18.0, 9.0, 13.0, 22.0, 27.0, 40.0, 51.0, 47.0, 60.0, 64.0, 74.0, 67.0, 78.0, 61.0, 61.0, 52.0, 47.0, 34.0, 23.0, 23.0, 19.0, 14.0, 8.0, 5.0, 12.0, 6.0, 6.0, 8.0, 2.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.9314727783203, -242.275390625, -234.61929321289062, -226.96319580078125, -219.30711364746094, -211.65103149414062, -203.99493408203125, -196.33883666992188, -188.68275451660156, -181.02667236328125, -173.37057495117188, -165.7144775390625, -158.0583953857422, -150.40231323242188, -142.7462158203125, -135.09011840820312, -127.43403625488281, -119.77794647216797, -112.12185668945312, -104.46576690673828, -96.80967712402344, -89.1535873413086, -81.49749755859375, -73.8414077758789, -66.18531799316406, -58.52922821044922, -50.873138427734375, -43.21704864501953, -35.56095886230469, -27.904869079589844, -20.248779296875, -12.592689514160156, -4.93658447265625, 2.7195053100585938, 10.375595092773438, 18.03168487548828, 25.687774658203125, 33.34386444091797, 40.99995422363281, 48.656044006347656, 56.3121337890625, 63.968223571777344, 71.62431335449219, 79.28040313720703, 86.93649291992188, 94.59258270263672, 102.24867248535156, 109.9047622680664, 117.56085205078125, 125.2169418334961, 132.87303161621094, 140.52911376953125, 148.18521118164062, 155.84130859375, 163.4973907470703, 171.15347290039062, 178.8095703125, 186.46566772460938, 194.1217498779297, 201.77783203125, 209.43392944335938, 217.09002685546875, 224.74610900878906, 232.40219116210938, 240.05828857421875]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 7.0, 7.0, 4.0, 13.0, 10.0, 14.0, 15.0, 9.0, 14.0, 22.0, 15.0, 32.0, 24.0, 31.0, 35.0, 37.0, 33.0, 36.0, 44.0, 30.0, 34.0, 41.0, 33.0, 27.0, 36.0, 42.0, 33.0, 32.0, 28.0, 29.0, 36.0, 27.0, 24.0, 17.0, 17.0, 23.0, 15.0, 18.0, 13.0, 8.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-174.856201171875, -169.59498596191406, -164.33377075195312, -159.07257080078125, -153.8113555908203, -148.55014038085938, -143.2889404296875, -138.02772521972656, -132.76651000976562, -127.50529479980469, -122.24408721923828, -116.98287963867188, -111.72166442871094, -106.46044921875, -101.1992416381836, -95.93803405761719, -90.67681884765625, -85.41560363769531, -80.1543960571289, -74.8931884765625, -69.63197326660156, -64.37075805664062, -59.10955047607422, -53.84833908081055, -48.587127685546875, -43.3259162902832, -38.06470489501953, -32.80349349975586, -27.542282104492188, -22.281070709228516, -17.019859313964844, -11.758647918701172, -6.4974365234375, -1.2362251281738281, 4.024986267089844, 9.286197662353516, 14.547409057617188, 19.80862045288086, 25.06983184814453, 30.331043243408203, 35.592254638671875, 40.85346603393555, 46.11467742919922, 51.37588882446289, 56.63710021972656, 61.898311614990234, 67.1595230102539, 72.42073059082031, 77.68194580078125, 82.94316101074219, 88.2043685913086, 93.465576171875, 98.72679138183594, 103.98800659179688, 109.24921417236328, 114.51042175292969, 119.77163696289062, 125.03285217285156, 130.2940673828125, 135.55526733398438, 140.8164825439453, 146.07769775390625, 151.33889770507812, 156.60011291503906, 161.861328125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 13.0, 30.0, 27.0, 54.0, 62.0, 104.0, 154.0, 249.0, 324.0, 507.0, 665.0, 1026.0, 1465.0, 2000.0, 3003.0, 4400.0, 6544.0, 9300.0, 13939.0, 20857.0, 31236.0, 48753.0, 78673.0, 135441.0, 310073.0, 1035601.0, 1461191.0, 564349.0, 189489.0, 101190.0, 61027.0, 38452.0, 24877.0, 16097.0, 10820.0, 7262.0, 4867.0, 3255.0, 2283.0, 1555.0, 1016.0, 676.0, 467.0, 282.0, 202.0, 152.0, 73.0, 69.0, 40.0, 31.0, 24.0, 13.0, 7.0, 1.0, 4.0, 0.0, 2.0], "bins": [-193.125, -187.314453125, -181.50390625, -175.693359375, -169.8828125, -164.072265625, -158.26171875, -152.451171875, -146.640625, -140.830078125, -135.01953125, -129.208984375, -123.3984375, -117.587890625, -111.77734375, -105.966796875, -100.15625, -94.345703125, -88.53515625, -82.724609375, -76.9140625, -71.103515625, -65.29296875, -59.482421875, -53.671875, -47.861328125, -42.05078125, -36.240234375, -30.4296875, -24.619140625, -18.80859375, -12.998046875, -7.1875, -1.376953125, 4.43359375, 10.244140625, 16.0546875, 21.865234375, 27.67578125, 33.486328125, 39.296875, 45.107421875, 50.91796875, 56.728515625, 62.5390625, 68.349609375, 74.16015625, 79.970703125, 85.78125, 91.591796875, 97.40234375, 103.212890625, 109.0234375, 114.833984375, 120.64453125, 126.455078125, 132.265625, 138.076171875, 143.88671875, 149.697265625, 155.5078125, 161.318359375, 167.12890625, 172.939453125, 178.75]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 8.0, 10.0, 8.0, 10.0, 18.0, 12.0, 14.0, 14.0, 22.0, 17.0, 21.0, 28.0, 35.0, 34.0, 29.0, 36.0, 30.0, 30.0, 39.0, 32.0, 49.0, 36.0, 47.0, 55.0, 30.0, 30.0, 42.0, 30.0, 30.0, 28.0, 26.0, 18.0, 18.0, 22.0, 15.0, 9.0, 15.0, 11.0, 12.0, 9.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-88.9375, -86.216796875, -83.49609375, -80.775390625, -78.0546875, -75.333984375, -72.61328125, -69.892578125, -67.171875, -64.451171875, -61.73046875, -59.009765625, -56.2890625, -53.568359375, -50.84765625, -48.126953125, -45.40625, -42.685546875, -39.96484375, -37.244140625, -34.5234375, -31.802734375, -29.08203125, -26.361328125, -23.640625, -20.919921875, -18.19921875, -15.478515625, -12.7578125, -10.037109375, -7.31640625, -4.595703125, -1.875, 0.845703125, 3.56640625, 6.287109375, 9.0078125, 11.728515625, 14.44921875, 17.169921875, 19.890625, 22.611328125, 25.33203125, 28.052734375, 30.7734375, 33.494140625, 36.21484375, 38.935546875, 41.65625, 44.376953125, 47.09765625, 49.818359375, 52.5390625, 55.259765625, 57.98046875, 60.701171875, 63.421875, 66.142578125, 68.86328125, 71.583984375, 74.3046875, 77.025390625, 79.74609375, 82.466796875, 85.1875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 11.0, 11.0, 16.0, 21.0, 44.0, 57.0, 101.0, 150.0, 230.0, 354.0, 567.0, 1005.0, 1665.0, 2805.0, 4839.0, 8672.0, 15574.0, 27724.0, 51440.0, 99196.0, 203011.0, 463027.0, 1359205.0, 1165683.0, 409169.0, 183649.0, 90201.0, 47401.0, 25635.0, 14102.0, 7886.0, 4430.0, 2677.0, 1486.0, 874.0, 510.0, 305.0, 196.0, 143.0, 75.0, 38.0, 24.0, 22.0, 23.0, 11.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-191.5, -186.017578125, -180.53515625, -175.052734375, -169.5703125, -164.087890625, -158.60546875, -153.123046875, -147.640625, -142.158203125, -136.67578125, -131.193359375, -125.7109375, -120.228515625, -114.74609375, -109.263671875, -103.78125, -98.298828125, -92.81640625, -87.333984375, -81.8515625, -76.369140625, -70.88671875, -65.404296875, -59.921875, -54.439453125, -48.95703125, -43.474609375, -37.9921875, -32.509765625, -27.02734375, -21.544921875, -16.0625, -10.580078125, -5.09765625, 0.384765625, 5.8671875, 11.349609375, 16.83203125, 22.314453125, 27.796875, 33.279296875, 38.76171875, 44.244140625, 49.7265625, 55.208984375, 60.69140625, 66.173828125, 71.65625, 77.138671875, 82.62109375, 88.103515625, 93.5859375, 99.068359375, 104.55078125, 110.033203125, 115.515625, 120.998046875, 126.48046875, 131.962890625, 137.4453125, 142.927734375, 148.41015625, 153.892578125, 159.375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 11.0, 21.0, 25.0, 25.0, 29.0, 43.0, 46.0, 54.0, 79.0, 86.0, 117.0, 126.0, 157.0, 211.0, 280.0, 345.0, 408.0, 407.0, 338.0, 230.0, 197.0, 159.0, 115.0, 114.0, 86.0, 57.0, 47.0, 51.0, 40.0, 36.0, 27.0, 19.0, 20.0, 11.0, 15.0, 12.0, 7.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.875, -44.23779296875, -42.6005859375, -40.96337890625, -39.326171875, -37.68896484375, -36.0517578125, -34.41455078125, -32.77734375, -31.14013671875, -29.5029296875, -27.86572265625, -26.228515625, -24.59130859375, -22.9541015625, -21.31689453125, -19.6796875, -18.04248046875, -16.4052734375, -14.76806640625, -13.130859375, -11.49365234375, -9.8564453125, -8.21923828125, -6.58203125, -4.94482421875, -3.3076171875, -1.67041015625, -0.033203125, 1.60400390625, 3.2412109375, 4.87841796875, 6.515625, 8.15283203125, 9.7900390625, 11.42724609375, 13.064453125, 14.70166015625, 16.3388671875, 17.97607421875, 19.61328125, 21.25048828125, 22.8876953125, 24.52490234375, 26.162109375, 27.79931640625, 29.4365234375, 31.07373046875, 32.7109375, 34.34814453125, 35.9853515625, 37.62255859375, 39.259765625, 40.89697265625, 42.5341796875, 44.17138671875, 45.80859375, 47.44580078125, 49.0830078125, 50.72021484375, 52.357421875, 53.99462890625, 55.6318359375, 57.26904296875, 58.90625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 8.0, 7.0, 24.0, 17.0, 21.0, 37.0, 37.0, 45.0, 59.0, 68.0, 64.0, 80.0, 90.0, 75.0, 68.0, 52.0, 42.0, 52.0, 32.0, 26.0, 14.0, 22.0, 12.0, 9.0, 8.0, 12.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-161.36619567871094, -156.6692352294922, -151.97227478027344, -147.2753143310547, -142.57835388183594, -137.8813934326172, -133.18443298339844, -128.4874725341797, -123.79051208496094, -119.09355163574219, -114.39659118652344, -109.69963073730469, -105.00267028808594, -100.30570983886719, -95.60874938964844, -90.91178894042969, -86.21483612060547, -81.51787567138672, -76.82091522216797, -72.12395477294922, -67.42699432373047, -62.73003387451172, -58.033077239990234, -53.336116790771484, -48.639156341552734, -43.942195892333984, -39.245235443115234, -34.54827880859375, -29.851316452026367, -25.154356002807617, -20.4573974609375, -15.76043701171875, -11.0634765625, -6.366516590118408, -1.6695566177368164, 3.027402877807617, 7.724363327026367, 12.421323776245117, 17.118282318115234, 21.815242767333984, 26.512203216552734, 31.209163665771484, 35.906124114990234, 40.60308074951172, 45.30004119873047, 49.99700164794922, 54.69396209716797, 59.39092254638672, 64.08788299560547, 68.78484344482422, 73.48180389404297, 78.17876434326172, 82.87572479248047, 87.57268524169922, 92.26963806152344, 96.96659851074219, 101.66355895996094, 106.36051940917969, 111.05747985839844, 115.75444030761719, 120.45140075683594, 125.14836120605469, 129.84532165527344, 134.5422821044922, 139.23924255371094]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 7.0, 9.0, 12.0, 12.0, 17.0, 16.0, 16.0, 11.0, 19.0, 25.0, 29.0, 22.0, 26.0, 25.0, 36.0, 38.0, 37.0, 38.0, 33.0, 34.0, 34.0, 37.0, 33.0, 32.0, 37.0, 26.0, 33.0, 32.0, 32.0, 33.0, 19.0, 32.0, 21.0, 15.0, 17.0, 17.0, 15.0, 19.0, 9.0, 9.0, 6.0, 6.0, 1.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-94.41848754882812, -91.6406478881836, -88.86280822753906, -86.08496856689453, -83.30712890625, -80.52928924560547, -77.75144958496094, -74.97360229492188, -72.19577026367188, -69.41793060302734, -66.64009094238281, -63.86225128173828, -61.08441162109375, -58.30657196044922, -55.52872848510742, -52.75088882446289, -49.973045349121094, -47.19520568847656, -44.41736602783203, -41.6395263671875, -38.86168670654297, -36.08384704589844, -33.30600357055664, -30.52816390991211, -27.750324249267578, -24.972484588623047, -22.194644927978516, -19.41680335998535, -16.63896369934082, -13.861124038696289, -11.083282470703125, -8.305442810058594, -5.5276031494140625, -2.749763011932373, 0.028077125549316406, 2.805917739868164, 5.583757400512695, 8.361597061157227, 11.13943862915039, 13.917278289794922, 16.695117950439453, 19.472957611083984, 22.250797271728516, 25.02863883972168, 27.80647850036621, 30.584318161010742, 33.362159729003906, 36.13999938964844, 38.91783905029297, 41.6956787109375, 44.47351837158203, 47.25135803222656, 50.029197692871094, 52.807037353515625, 55.58488082885742, 58.36272048950195, 61.140560150146484, 63.918399810791016, 66.69624328613281, 69.47408294677734, 72.25192260742188, 75.0297622680664, 77.80760192871094, 80.58544158935547, 83.36328125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 12.0, 23.0, 25.0, 44.0, 72.0, 89.0, 128.0, 171.0, 277.0, 406.0, 611.0, 843.0, 1258.0, 1989.0, 2768.0, 4172.0, 6570.0, 10142.0, 15855.0, 24937.0, 40619.0, 67477.0, 117494.0, 207609.0, 223413.0, 128906.0, 73879.0, 43693.0, 26540.0, 16848.0, 10732.0, 6964.0, 4637.0, 3034.0, 2044.0, 1310.0, 910.0, 636.0, 439.0, 295.0, 188.0, 152.0, 98.0, 71.0, 56.0, 28.0, 24.0, 19.0, 11.0, 9.0, 6.0, 7.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-91.6875, -88.7373046875, -85.787109375, -82.8369140625, -79.88671875, -76.9365234375, -73.986328125, -71.0361328125, -68.0859375, -65.1357421875, -62.185546875, -59.2353515625, -56.28515625, -53.3349609375, -50.384765625, -47.4345703125, -44.484375, -41.5341796875, -38.583984375, -35.6337890625, -32.68359375, -29.7333984375, -26.783203125, -23.8330078125, -20.8828125, -17.9326171875, -14.982421875, -12.0322265625, -9.08203125, -6.1318359375, -3.181640625, -0.2314453125, 2.71875, 5.6689453125, 8.619140625, 11.5693359375, 14.51953125, 17.4697265625, 20.419921875, 23.3701171875, 26.3203125, 29.2705078125, 32.220703125, 35.1708984375, 38.12109375, 41.0712890625, 44.021484375, 46.9716796875, 49.921875, 52.8720703125, 55.822265625, 58.7724609375, 61.72265625, 64.6728515625, 67.623046875, 70.5732421875, 73.5234375, 76.4736328125, 79.423828125, 82.3740234375, 85.32421875, 88.2744140625, 91.224609375, 94.1748046875, 97.125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 3.0, 5.0, 7.0, 7.0, 14.0, 10.0, 20.0, 18.0, 22.0, 25.0, 20.0, 16.0, 28.0, 30.0, 36.0, 34.0, 36.0, 36.0, 41.0, 37.0, 43.0, 35.0, 44.0, 34.0, 35.0, 47.0, 33.0, 55.0, 29.0, 27.0, 18.0, 21.0, 19.0, 18.0, 13.0, 19.0, 14.0, 8.0, 9.0, 10.0, 7.0, 4.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.1875, -75.587890625, -72.98828125, -70.388671875, -67.7890625, -65.189453125, -62.58984375, -59.990234375, -57.390625, -54.791015625, -52.19140625, -49.591796875, -46.9921875, -44.392578125, -41.79296875, -39.193359375, -36.59375, -33.994140625, -31.39453125, -28.794921875, -26.1953125, -23.595703125, -20.99609375, -18.396484375, -15.796875, -13.197265625, -10.59765625, -7.998046875, -5.3984375, -2.798828125, -0.19921875, 2.400390625, 5.0, 7.599609375, 10.19921875, 12.798828125, 15.3984375, 17.998046875, 20.59765625, 23.197265625, 25.796875, 28.396484375, 30.99609375, 33.595703125, 36.1953125, 38.794921875, 41.39453125, 43.994140625, 46.59375, 49.193359375, 51.79296875, 54.392578125, 56.9921875, 59.591796875, 62.19140625, 64.791015625, 67.390625, 69.990234375, 72.58984375, 75.189453125, 77.7890625, 80.388671875, 82.98828125, 85.587890625, 88.1875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 8.0, 9.0, 12.0, 19.0, 18.0, 29.0, 61.0, 82.0, 121.0, 217.0, 366.0, 551.0, 816.0, 1408.0, 2145.0, 3495.0, 5782.0, 9523.0, 16474.0, 31207.0, 67502.0, 198287.0, 444514.0, 147835.0, 55498.0, 26354.0, 14484.0, 8355.0, 4994.0, 3094.0, 1922.0, 1249.0, 765.0, 485.0, 307.0, 206.0, 138.0, 66.0, 48.0, 31.0, 28.0, 11.0, 6.0, 5.0, 6.0, 11.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.375, -68.05859375, -65.7421875, -63.42578125, -61.109375, -58.79296875, -56.4765625, -54.16015625, -51.84375, -49.52734375, -47.2109375, -44.89453125, -42.578125, -40.26171875, -37.9453125, -35.62890625, -33.3125, -30.99609375, -28.6796875, -26.36328125, -24.046875, -21.73046875, -19.4140625, -17.09765625, -14.78125, -12.46484375, -10.1484375, -7.83203125, -5.515625, -3.19921875, -0.8828125, 1.43359375, 3.75, 6.06640625, 8.3828125, 10.69921875, 13.015625, 15.33203125, 17.6484375, 19.96484375, 22.28125, 24.59765625, 26.9140625, 29.23046875, 31.546875, 33.86328125, 36.1796875, 38.49609375, 40.8125, 43.12890625, 45.4453125, 47.76171875, 50.078125, 52.39453125, 54.7109375, 57.02734375, 59.34375, 61.66015625, 63.9765625, 66.29296875, 68.609375, 70.92578125, 73.2421875, 75.55859375, 77.875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 9.0, 19.0, 12.0, 21.0, 11.0, 22.0, 22.0, 27.0, 23.0, 28.0, 19.0, 36.0, 28.0, 35.0, 39.0, 36.0, 33.0, 37.0, 40.0, 43.0, 33.0, 26.0, 38.0, 40.0, 26.0, 41.0, 27.0, 23.0, 28.0, 16.0, 24.0, 18.0, 13.0, 23.0, 13.0, 9.0, 8.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.9375, -50.26318359375, -48.5888671875, -46.91455078125, -45.240234375, -43.56591796875, -41.8916015625, -40.21728515625, -38.54296875, -36.86865234375, -35.1943359375, -33.52001953125, -31.845703125, -30.17138671875, -28.4970703125, -26.82275390625, -25.1484375, -23.47412109375, -21.7998046875, -20.12548828125, -18.451171875, -16.77685546875, -15.1025390625, -13.42822265625, -11.75390625, -10.07958984375, -8.4052734375, -6.73095703125, -5.056640625, -3.38232421875, -1.7080078125, -0.03369140625, 1.640625, 3.31494140625, 4.9892578125, 6.66357421875, 8.337890625, 10.01220703125, 11.6865234375, 13.36083984375, 15.03515625, 16.70947265625, 18.3837890625, 20.05810546875, 21.732421875, 23.40673828125, 25.0810546875, 26.75537109375, 28.4296875, 30.10400390625, 31.7783203125, 33.45263671875, 35.126953125, 36.80126953125, 38.4755859375, 40.14990234375, 41.82421875, 43.49853515625, 45.1728515625, 46.84716796875, 48.521484375, 50.19580078125, 51.8701171875, 53.54443359375, 55.21875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 10.0, 12.0, 12.0, 19.0, 22.0, 39.0, 33.0, 55.0, 63.0, 97.0, 125.0, 208.0, 309.0, 477.0, 720.0, 1061.0, 1751.0, 2975.0, 5390.0, 11526.0, 29208.0, 109135.0, 701249.0, 125983.0, 31862.0, 12200.0, 5822.0, 3064.0, 1727.0, 1139.0, 679.0, 482.0, 317.0, 228.0, 160.0, 94.0, 79.0, 60.0, 34.0, 34.0, 39.0, 6.0, 12.0, 10.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-45.9375, -44.48095703125, -43.0244140625, -41.56787109375, -40.111328125, -38.65478515625, -37.1982421875, -35.74169921875, -34.28515625, -32.82861328125, -31.3720703125, -29.91552734375, -28.458984375, -27.00244140625, -25.5458984375, -24.08935546875, -22.6328125, -21.17626953125, -19.7197265625, -18.26318359375, -16.806640625, -15.35009765625, -13.8935546875, -12.43701171875, -10.98046875, -9.52392578125, -8.0673828125, -6.61083984375, -5.154296875, -3.69775390625, -2.2412109375, -0.78466796875, 0.671875, 2.12841796875, 3.5849609375, 5.04150390625, 6.498046875, 7.95458984375, 9.4111328125, 10.86767578125, 12.32421875, 13.78076171875, 15.2373046875, 16.69384765625, 18.150390625, 19.60693359375, 21.0634765625, 22.52001953125, 23.9765625, 25.43310546875, 26.8896484375, 28.34619140625, 29.802734375, 31.25927734375, 32.7158203125, 34.17236328125, 35.62890625, 37.08544921875, 38.5419921875, 39.99853515625, 41.455078125, 42.91162109375, 44.3681640625, 45.82470703125, 47.28125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 7.0, 5.0, 8.0, 9.0, 7.0, 14.0, 18.0, 24.0, 15.0, 39.0, 26.0, 38.0, 57.0, 51.0, 68.0, 69.0, 78.0, 72.0, 71.0, 68.0, 48.0, 37.0, 30.0, 28.0, 25.0, 17.0, 12.0, 10.0, 8.0, 6.0, 7.0, 7.0, 3.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003269195556640625, -0.003161996603012085, -0.003054797649383545, -0.002947598695755005, -0.002840399742126465, -0.002733200788497925, -0.0026260018348693848, -0.0025188028812408447, -0.0024116039276123047, -0.0023044049739837646, -0.0021972060203552246, -0.0020900070667266846, -0.0019828081130981445, -0.0018756091594696045, -0.0017684102058410645, -0.0016612112522125244, -0.0015540122985839844, -0.0014468133449554443, -0.0013396143913269043, -0.0012324154376983643, -0.0011252164840698242, -0.0010180175304412842, -0.0009108185768127441, -0.0008036196231842041, -0.0006964206695556641, -0.000589221715927124, -0.000482022762298584, -0.00037482380867004395, -0.0002676248550415039, -0.00016042590141296387, -5.322694778442383e-05, 5.397200584411621e-05, 0.00016117095947265625, 0.0002683699131011963, 0.00037556886672973633, 0.00048276782035827637, 0.0005899667739868164, 0.0006971657276153564, 0.0008043646812438965, 0.0009115636348724365, 0.0010187625885009766, 0.0011259615421295166, 0.0012331604957580566, 0.0013403594493865967, 0.0014475584030151367, 0.0015547573566436768, 0.0016619563102722168, 0.0017691552639007568, 0.0018763542175292969, 0.001983553171157837, 0.002090752124786377, 0.002197951078414917, 0.002305150032043457, 0.002412348985671997, 0.002519547939300537, 0.002626746892929077, 0.002733945846557617, 0.0028411448001861572, 0.0029483437538146973, 0.0030555427074432373, 0.0031627416610717773, 0.0032699406147003174, 0.0033771395683288574, 0.0034843385219573975, 0.0035915374755859375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 5.0, 8.0, 17.0, 18.0, 31.0, 46.0, 63.0, 84.0, 142.0, 182.0, 309.0, 435.0, 684.0, 1068.0, 1703.0, 2784.0, 4693.0, 8178.0, 15640.0, 33558.0, 92243.0, 453097.0, 299860.0, 73199.0, 28398.0, 13706.0, 7328.0, 4173.0, 2466.0, 1548.0, 1009.0, 624.0, 395.0, 267.0, 203.0, 137.0, 80.0, 52.0, 38.0, 20.0, 24.0, 11.0, 10.0, 7.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.8125, -86.9970703125, -84.181640625, -81.3662109375, -78.55078125, -75.7353515625, -72.919921875, -70.1044921875, -67.2890625, -64.4736328125, -61.658203125, -58.8427734375, -56.02734375, -53.2119140625, -50.396484375, -47.5810546875, -44.765625, -41.9501953125, -39.134765625, -36.3193359375, -33.50390625, -30.6884765625, -27.873046875, -25.0576171875, -22.2421875, -19.4267578125, -16.611328125, -13.7958984375, -10.98046875, -8.1650390625, -5.349609375, -2.5341796875, 0.28125, 3.0966796875, 5.912109375, 8.7275390625, 11.54296875, 14.3583984375, 17.173828125, 19.9892578125, 22.8046875, 25.6201171875, 28.435546875, 31.2509765625, 34.06640625, 36.8818359375, 39.697265625, 42.5126953125, 45.328125, 48.1435546875, 50.958984375, 53.7744140625, 56.58984375, 59.4052734375, 62.220703125, 65.0361328125, 67.8515625, 70.6669921875, 73.482421875, 76.2978515625, 79.11328125, 81.9287109375, 84.744140625, 87.5595703125, 90.375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 5.0, 5.0, 6.0, 6.0, 7.0, 8.0, 15.0, 14.0, 12.0, 13.0, 20.0, 28.0, 45.0, 57.0, 65.0, 122.0, 129.0, 121.0, 86.0, 64.0, 28.0, 28.0, 16.0, 16.0, 14.0, 11.0, 14.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 4.0, 2.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.3125, -23.566162109375, -22.81982421875, -22.073486328125, -21.3271484375, -20.580810546875, -19.83447265625, -19.088134765625, -18.341796875, -17.595458984375, -16.84912109375, -16.102783203125, -15.3564453125, -14.610107421875, -13.86376953125, -13.117431640625, -12.37109375, -11.624755859375, -10.87841796875, -10.132080078125, -9.3857421875, -8.639404296875, -7.89306640625, -7.146728515625, -6.400390625, -5.654052734375, -4.90771484375, -4.161376953125, -3.4150390625, -2.668701171875, -1.92236328125, -1.176025390625, -0.4296875, 0.316650390625, 1.06298828125, 1.809326171875, 2.5556640625, 3.302001953125, 4.04833984375, 4.794677734375, 5.541015625, 6.287353515625, 7.03369140625, 7.780029296875, 8.5263671875, 9.272705078125, 10.01904296875, 10.765380859375, 11.51171875, 12.258056640625, 13.00439453125, 13.750732421875, 14.4970703125, 15.243408203125, 15.98974609375, 16.736083984375, 17.482421875, 18.228759765625, 18.97509765625, 19.721435546875, 20.4677734375, 21.214111328125, 21.96044921875, 22.706787109375, 23.453125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 11.0, 10.0, 7.0, 22.0, 25.0, 33.0, 47.0, 44.0, 79.0, 81.0, 91.0, 82.0, 88.0, 73.0, 44.0, 47.0, 38.0, 34.0, 33.0, 25.0, 17.0, 15.0, 16.0, 8.0, 5.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.10484313964844, -123.93560028076172, -119.766357421875, -115.59710693359375, -111.42786407470703, -107.25862121582031, -103.0893783569336, -98.92013549804688, -94.75088500976562, -90.5816421508789, -86.41239929199219, -82.24314880371094, -78.07390594482422, -73.9046630859375, -69.73542022705078, -65.56617736816406, -61.396934509277344, -57.227691650390625, -53.05844497680664, -48.88920211791992, -44.71995544433594, -40.55071258544922, -36.3814697265625, -32.21222686767578, -28.042980194091797, -23.873735427856445, -19.704490661621094, -15.535247802734375, -11.366003036499023, -7.196758270263672, -3.027515411376953, 1.1417293548583984, 5.31097412109375, 9.480218887329102, 13.649462699890137, 17.818706512451172, 21.987951278686523, 26.157196044921875, 30.326438903808594, 34.49568176269531, 38.6649284362793, 42.834171295166016, 47.00341796875, 51.17266082763672, 55.34190368652344, 59.51115036010742, 63.68039321899414, 67.84963989257812, 72.01888275146484, 76.18812561035156, 80.35736846923828, 84.526611328125, 88.69586181640625, 92.86510467529297, 97.03434753417969, 101.2035903930664, 105.37283325195312, 109.54207611083984, 113.71131896972656, 117.88056945800781, 122.04981231689453, 126.21905517578125, 130.3883056640625, 134.5575408935547, 138.72679138183594]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 9.0, 5.0, 9.0, 6.0, 6.0, 12.0, 7.0, 18.0, 11.0, 12.0, 18.0, 15.0, 17.0, 21.0, 23.0, 18.0, 28.0, 27.0, 21.0, 36.0, 46.0, 38.0, 26.0, 39.0, 37.0, 36.0, 27.0, 33.0, 25.0, 33.0, 32.0, 26.0, 22.0, 31.0, 22.0, 24.0, 30.0, 31.0, 17.0, 19.0, 11.0, 9.0, 8.0, 20.0, 1.0, 14.0, 5.0, 8.0, 5.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-69.20663452148438, -66.94244384765625, -64.67825317382812, -62.414066314697266, -60.14987564086914, -57.88568878173828, -55.621498107910156, -53.35730743408203, -51.093116760253906, -48.82892608642578, -46.56473922729492, -44.3005485534668, -42.03635787963867, -39.77217102050781, -37.50798034667969, -35.24378967285156, -32.9796028137207, -30.71541404724121, -28.451223373413086, -26.187034606933594, -23.92284393310547, -21.658655166625977, -19.394466400146484, -17.13027572631836, -14.866086959838867, -12.601897239685059, -10.33770751953125, -8.073518753051758, -5.809329032897949, -3.5451393127441406, -1.2809505462646484, 0.9832391738891602, 3.2474288940429688, 5.511618614196777, 7.775807857513428, 10.039997100830078, 12.304186820983887, 14.568376541137695, 16.832565307617188, 19.096755981445312, 21.360944747924805, 23.625133514404297, 25.889324188232422, 28.153512954711914, 30.417701721191406, 32.68189239501953, 34.946083068847656, 37.210269927978516, 39.47446060180664, 41.738651275634766, 44.002838134765625, 46.26702880859375, 48.531219482421875, 50.79541015625, 53.05959701538086, 55.323787689208984, 57.587974548339844, 59.85216522216797, 62.11635208129883, 64.38053894042969, 66.64472961425781, 68.90892028808594, 71.17311096191406, 73.43730163574219, 75.70149230957031]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 7.0, 11.0, 8.0, 11.0, 15.0, 25.0, 35.0, 45.0, 69.0, 118.0, 170.0, 277.0, 439.0, 768.0, 1192.0, 1829.0, 2783.0, 4304.0, 6808.0, 11015.0, 17936.0, 30053.0, 51353.0, 88735.0, 149803.0, 206444.0, 185483.0, 118491.0, 68863.0, 39607.0, 23444.0, 14339.0, 8789.0, 5514.0, 3486.0, 2205.0, 1460.0, 892.0, 632.0, 370.0, 236.0, 152.0, 110.0, 67.0, 38.0, 30.0, 16.0, 20.0, 15.0, 8.0, 8.0, 3.0, 6.0, 9.0, 2.0, 3.0, 0.0, 2.0], "bins": [-143.625, -139.103515625, -134.58203125, -130.060546875, -125.5390625, -121.017578125, -116.49609375, -111.974609375, -107.453125, -102.931640625, -98.41015625, -93.888671875, -89.3671875, -84.845703125, -80.32421875, -75.802734375, -71.28125, -66.759765625, -62.23828125, -57.716796875, -53.1953125, -48.673828125, -44.15234375, -39.630859375, -35.109375, -30.587890625, -26.06640625, -21.544921875, -17.0234375, -12.501953125, -7.98046875, -3.458984375, 1.0625, 5.583984375, 10.10546875, 14.626953125, 19.1484375, 23.669921875, 28.19140625, 32.712890625, 37.234375, 41.755859375, 46.27734375, 50.798828125, 55.3203125, 59.841796875, 64.36328125, 68.884765625, 73.40625, 77.927734375, 82.44921875, 86.970703125, 91.4921875, 96.013671875, 100.53515625, 105.056640625, 109.578125, 114.099609375, 118.62109375, 123.142578125, 127.6640625, 132.185546875, 136.70703125, 141.228515625, 145.75]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 2.0, 3.0, 9.0, 14.0, 9.0, 15.0, 20.0, 17.0, 20.0, 26.0, 17.0, 23.0, 23.0, 24.0, 29.0, 30.0, 36.0, 30.0, 40.0, 38.0, 34.0, 30.0, 36.0, 32.0, 31.0, 34.0, 33.0, 29.0, 23.0, 29.0, 25.0, 30.0, 31.0, 24.0, 20.0, 17.0, 22.0, 12.0, 13.0, 12.0, 6.0, 8.0, 5.0, 9.0, 8.0, 1.0, 9.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.25, -47.5712890625, -45.892578125, -44.2138671875, -42.53515625, -40.8564453125, -39.177734375, -37.4990234375, -35.8203125, -34.1416015625, -32.462890625, -30.7841796875, -29.10546875, -27.4267578125, -25.748046875, -24.0693359375, -22.390625, -20.7119140625, -19.033203125, -17.3544921875, -15.67578125, -13.9970703125, -12.318359375, -10.6396484375, -8.9609375, -7.2822265625, -5.603515625, -3.9248046875, -2.24609375, -0.5673828125, 1.111328125, 2.7900390625, 4.46875, 6.1474609375, 7.826171875, 9.5048828125, 11.18359375, 12.8623046875, 14.541015625, 16.2197265625, 17.8984375, 19.5771484375, 21.255859375, 22.9345703125, 24.61328125, 26.2919921875, 27.970703125, 29.6494140625, 31.328125, 33.0068359375, 34.685546875, 36.3642578125, 38.04296875, 39.7216796875, 41.400390625, 43.0791015625, 44.7578125, 46.4365234375, 48.115234375, 49.7939453125, 51.47265625, 53.1513671875, 54.830078125, 56.5087890625, 58.1875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 7.0, 11.0, 16.0, 23.0, 35.0, 59.0, 93.0, 144.0, 200.0, 297.0, 422.0, 632.0, 951.0, 1493.0, 2216.0, 3285.0, 5115.0, 7900.0, 12351.0, 19702.0, 31244.0, 48896.0, 78536.0, 119966.0, 165863.0, 175232.0, 133173.0, 88037.0, 56033.0, 34904.0, 21820.0, 14071.0, 8930.0, 5858.0, 3740.0, 2500.0, 1596.0, 1102.0, 698.0, 453.0, 319.0, 211.0, 147.0, 81.0, 55.0, 51.0, 30.0, 21.0, 12.0, 8.0, 9.0, 3.0, 4.0, 0.0, 0.0, 1.0, 3.0], "bins": [-106.1875, -102.8828125, -99.578125, -96.2734375, -92.96875, -89.6640625, -86.359375, -83.0546875, -79.75, -76.4453125, -73.140625, -69.8359375, -66.53125, -63.2265625, -59.921875, -56.6171875, -53.3125, -50.0078125, -46.703125, -43.3984375, -40.09375, -36.7890625, -33.484375, -30.1796875, -26.875, -23.5703125, -20.265625, -16.9609375, -13.65625, -10.3515625, -7.046875, -3.7421875, -0.4375, 2.8671875, 6.171875, 9.4765625, 12.78125, 16.0859375, 19.390625, 22.6953125, 26.0, 29.3046875, 32.609375, 35.9140625, 39.21875, 42.5234375, 45.828125, 49.1328125, 52.4375, 55.7421875, 59.046875, 62.3515625, 65.65625, 68.9609375, 72.265625, 75.5703125, 78.875, 82.1796875, 85.484375, 88.7890625, 92.09375, 95.3984375, 98.703125, 102.0078125, 105.3125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 0.0, 9.0, 8.0, 9.0, 8.0, 9.0, 11.0, 12.0, 13.0, 22.0, 23.0, 31.0, 38.0, 29.0, 35.0, 35.0, 38.0, 44.0, 50.0, 45.0, 46.0, 46.0, 50.0, 33.0, 36.0, 46.0, 38.0, 34.0, 32.0, 27.0, 27.0, 16.0, 16.0, 13.0, 18.0, 4.0, 15.0, 6.0, 9.0, 7.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.21875, -44.82958984375, -43.4404296875, -42.05126953125, -40.662109375, -39.27294921875, -37.8837890625, -36.49462890625, -35.10546875, -33.71630859375, -32.3271484375, -30.93798828125, -29.548828125, -28.15966796875, -26.7705078125, -25.38134765625, -23.9921875, -22.60302734375, -21.2138671875, -19.82470703125, -18.435546875, -17.04638671875, -15.6572265625, -14.26806640625, -12.87890625, -11.48974609375, -10.1005859375, -8.71142578125, -7.322265625, -5.93310546875, -4.5439453125, -3.15478515625, -1.765625, -0.37646484375, 1.0126953125, 2.40185546875, 3.791015625, 5.18017578125, 6.5693359375, 7.95849609375, 9.34765625, 10.73681640625, 12.1259765625, 13.51513671875, 14.904296875, 16.29345703125, 17.6826171875, 19.07177734375, 20.4609375, 21.85009765625, 23.2392578125, 24.62841796875, 26.017578125, 27.40673828125, 28.7958984375, 30.18505859375, 31.57421875, 32.96337890625, 34.3525390625, 35.74169921875, 37.130859375, 38.52001953125, 39.9091796875, 41.29833984375, 42.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 17.0, 15.0, 41.0, 37.0, 59.0, 81.0, 112.0, 162.0, 210.0, 312.0, 499.0, 730.0, 1130.0, 1861.0, 3145.0, 5500.0, 11643.0, 29733.0, 108378.0, 613000.0, 196363.0, 43046.0, 15648.0, 7010.0, 3724.0, 2169.0, 1250.0, 907.0, 553.0, 398.0, 252.0, 183.0, 112.0, 80.0, 59.0, 46.0, 19.0, 22.0, 14.0, 9.0, 6.0, 1.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-117.9375, -113.9619140625, -109.986328125, -106.0107421875, -102.03515625, -98.0595703125, -94.083984375, -90.1083984375, -86.1328125, -82.1572265625, -78.181640625, -74.2060546875, -70.23046875, -66.2548828125, -62.279296875, -58.3037109375, -54.328125, -50.3525390625, -46.376953125, -42.4013671875, -38.42578125, -34.4501953125, -30.474609375, -26.4990234375, -22.5234375, -18.5478515625, -14.572265625, -10.5966796875, -6.62109375, -2.6455078125, 1.330078125, 5.3056640625, 9.28125, 13.2568359375, 17.232421875, 21.2080078125, 25.18359375, 29.1591796875, 33.134765625, 37.1103515625, 41.0859375, 45.0615234375, 49.037109375, 53.0126953125, 56.98828125, 60.9638671875, 64.939453125, 68.9150390625, 72.890625, 76.8662109375, 80.841796875, 84.8173828125, 88.79296875, 92.7685546875, 96.744140625, 100.7197265625, 104.6953125, 108.6708984375, 112.646484375, 116.6220703125, 120.59765625, 124.5732421875, 128.548828125, 132.5244140625, 136.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 9.0, 15.0, 15.0, 27.0, 32.0, 66.0, 92.0, 111.0, 122.0, 143.0, 111.0, 76.0, 47.0, 44.0, 17.0, 20.0, 10.0, 11.0, 5.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0065765380859375, -0.006364762783050537, -0.006152987480163574, -0.005941212177276611, -0.0057294368743896484, -0.0055176615715026855, -0.005305886268615723, -0.00509411096572876, -0.004882335662841797, -0.004670560359954834, -0.004458785057067871, -0.004247009754180908, -0.004035234451293945, -0.0038234591484069824, -0.0036116838455200195, -0.0033999085426330566, -0.0031881332397460938, -0.002976357936859131, -0.002764582633972168, -0.002552807331085205, -0.002341032028198242, -0.0021292567253112793, -0.0019174814224243164, -0.0017057061195373535, -0.0014939308166503906, -0.0012821555137634277, -0.0010703802108764648, -0.000858604907989502, -0.0006468296051025391, -0.00043505430221557617, -0.00022327899932861328, -1.150369644165039e-05, 0.0002002716064453125, 0.0004120469093322754, 0.0006238222122192383, 0.0008355975151062012, 0.001047372817993164, 0.001259148120880127, 0.0014709234237670898, 0.0016826987266540527, 0.0018944740295410156, 0.0021062493324279785, 0.0023180246353149414, 0.0025297999382019043, 0.002741575241088867, 0.00295335054397583, 0.003165125846862793, 0.003376901149749756, 0.0035886764526367188, 0.0038004517555236816, 0.0040122270584106445, 0.004224002361297607, 0.00443577766418457, 0.004647552967071533, 0.004859328269958496, 0.005071103572845459, 0.005282878875732422, 0.005494654178619385, 0.005706429481506348, 0.0059182047843933105, 0.0061299800872802734, 0.006341755390167236, 0.006553530693054199, 0.006765305995941162, 0.006977081298828125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 8.0, 7.0, 9.0, 17.0, 19.0, 29.0, 39.0, 52.0, 58.0, 88.0, 132.0, 188.0, 261.0, 361.0, 497.0, 716.0, 1171.0, 1786.0, 2834.0, 4871.0, 9435.0, 22981.0, 84728.0, 614087.0, 231188.0, 41897.0, 14189.0, 6570.0, 3692.0, 2136.0, 1414.0, 938.0, 637.0, 422.0, 327.0, 214.0, 154.0, 104.0, 66.0, 59.0, 42.0, 44.0, 14.0, 23.0, 15.0, 4.0, 9.0, 7.0, 6.0, 4.0, 5.0, 1.0, 2.0], "bins": [-146.25, -142.0419921875, -137.833984375, -133.6259765625, -129.41796875, -125.2099609375, -121.001953125, -116.7939453125, -112.5859375, -108.3779296875, -104.169921875, -99.9619140625, -95.75390625, -91.5458984375, -87.337890625, -83.1298828125, -78.921875, -74.7138671875, -70.505859375, -66.2978515625, -62.08984375, -57.8818359375, -53.673828125, -49.4658203125, -45.2578125, -41.0498046875, -36.841796875, -32.6337890625, -28.42578125, -24.2177734375, -20.009765625, -15.8017578125, -11.59375, -7.3857421875, -3.177734375, 1.0302734375, 5.23828125, 9.4462890625, 13.654296875, 17.8623046875, 22.0703125, 26.2783203125, 30.486328125, 34.6943359375, 38.90234375, 43.1103515625, 47.318359375, 51.5263671875, 55.734375, 59.9423828125, 64.150390625, 68.3583984375, 72.56640625, 76.7744140625, 80.982421875, 85.1904296875, 89.3984375, 93.6064453125, 97.814453125, 102.0224609375, 106.23046875, 110.4384765625, 114.646484375, 118.8544921875, 123.0625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 5.0, 2.0, 7.0, 8.0, 9.0, 12.0, 32.0, 58.0, 82.0, 118.0, 159.0, 172.0, 96.0, 65.0, 43.0, 35.0, 28.0, 15.0, 11.0, 7.0, 5.0, 2.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.53125, -38.3232421875, -37.115234375, -35.9072265625, -34.69921875, -33.4912109375, -32.283203125, -31.0751953125, -29.8671875, -28.6591796875, -27.451171875, -26.2431640625, -25.03515625, -23.8271484375, -22.619140625, -21.4111328125, -20.203125, -18.9951171875, -17.787109375, -16.5791015625, -15.37109375, -14.1630859375, -12.955078125, -11.7470703125, -10.5390625, -9.3310546875, -8.123046875, -6.9150390625, -5.70703125, -4.4990234375, -3.291015625, -2.0830078125, -0.875, 0.3330078125, 1.541015625, 2.7490234375, 3.95703125, 5.1650390625, 6.373046875, 7.5810546875, 8.7890625, 9.9970703125, 11.205078125, 12.4130859375, 13.62109375, 14.8291015625, 16.037109375, 17.2451171875, 18.453125, 19.6611328125, 20.869140625, 22.0771484375, 23.28515625, 24.4931640625, 25.701171875, 26.9091796875, 28.1171875, 29.3251953125, 30.533203125, 31.7412109375, 32.94921875, 34.1572265625, 35.365234375, 36.5732421875, 37.78125]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 11.0, 19.0, 14.0, 24.0, 30.0, 42.0, 36.0, 64.0, 76.0, 97.0, 76.0, 69.0, 89.0, 61.0, 58.0, 45.0, 43.0, 31.0, 20.0, 21.0, 14.0, 6.0, 13.0, 10.0, 4.0, 4.0, 7.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.18022918701172, -100.01284790039062, -96.84546661376953, -93.67808532714844, -90.51070404052734, -87.34332275390625, -84.17594909667969, -81.0085678100586, -77.8411865234375, -74.6738052368164, -71.50642395019531, -68.33904266357422, -65.17166137695312, -62.0042839050293, -58.8369026184082, -55.669525146484375, -52.502140045166016, -49.33475875854492, -46.16737747192383, -43.0, -39.832618713378906, -36.66523742675781, -33.49785614013672, -30.330476760864258, -27.163095474243164, -23.99571418762207, -20.82833480834961, -17.660953521728516, -14.493573188781738, -11.326192855834961, -8.158811569213867, -4.991432189941406, -1.8240509033203125, 1.343329668045044, 4.5107102394104, 7.678091049194336, 10.845471382141113, 14.01285171508789, 17.180233001708984, 20.347612380981445, 23.51499366760254, 26.682374954223633, 29.849754333496094, 33.01713562011719, 36.18451690673828, 39.351898193359375, 42.51927947998047, 45.6866569519043, 48.85403823852539, 52.021419525146484, 55.18880081176758, 58.356178283691406, 61.5235595703125, 64.6909408569336, 67.85832214355469, 71.02570343017578, 74.19308471679688, 77.36046600341797, 80.52784729003906, 83.69522857666016, 86.86260986328125, 90.02998352050781, 93.19737243652344, 96.36474609375, 99.5321273803711]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 9.0, 8.0, 11.0, 20.0, 15.0, 14.0, 23.0, 22.0, 21.0, 26.0, 25.0, 26.0, 28.0, 42.0, 41.0, 34.0, 43.0, 45.0, 31.0, 43.0, 38.0, 33.0, 33.0, 34.0, 30.0, 25.0, 27.0, 35.0, 27.0, 27.0, 26.0, 23.0, 16.0, 22.0, 9.0, 6.0, 12.0, 6.0, 3.0, 10.0, 9.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-65.66488647460938, -63.542823791503906, -61.42076110839844, -59.298702239990234, -57.176639556884766, -55.0545768737793, -52.932518005371094, -50.810455322265625, -48.688392639160156, -46.56632995605469, -44.44426727294922, -42.322208404541016, -40.20014572143555, -38.07808303833008, -35.956024169921875, -33.833961486816406, -31.711898803710938, -29.58983612060547, -27.467775344848633, -25.345714569091797, -23.223651885986328, -21.10158920288086, -18.979528427124023, -16.857467651367188, -14.735404968261719, -12.613343238830566, -10.491281509399414, -8.369219779968262, -6.247158050537109, -4.125096321105957, -2.0030345916748047, 0.11902713775634766, 2.2410964965820312, 4.363158226013184, 6.485219955444336, 8.607281684875488, 10.72934341430664, 12.851405143737793, 14.973466873168945, 17.09552764892578, 19.21759033203125, 21.33965301513672, 23.461713790893555, 25.58377456665039, 27.70583724975586, 29.827899932861328, 31.949960708618164, 34.072021484375, 36.19408416748047, 38.31614685058594, 40.438209533691406, 42.56026840209961, 44.68233108520508, 46.80439376831055, 48.92645263671875, 51.04851531982422, 53.17057800292969, 55.292640686035156, 57.414703369140625, 59.53676223754883, 61.6588249206543, 63.780887603759766, 65.90294647216797, 68.02500915527344, 70.1470718383789]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 21.0, 28.0, 31.0, 70.0, 80.0, 176.0, 270.0, 396.0, 597.0, 851.0, 1266.0, 1935.0, 2890.0, 4546.0, 6744.0, 10508.0, 15609.0, 24217.0, 37352.0, 60844.0, 100113.0, 176193.0, 364817.0, 908995.0, 1260658.0, 620255.0, 244699.0, 131133.0, 77983.0, 48714.0, 30966.0, 20220.0, 13257.0, 8948.0, 6034.0, 4041.0, 2834.0, 1912.0, 1261.0, 870.0, 594.0, 384.0, 279.0, 206.0, 150.0, 105.0, 68.0, 49.0, 35.0, 16.0, 10.0, 10.0, 12.0, 6.0, 3.0, 9.0, 3.0], "bins": [-65.875, -63.76953125, -61.6640625, -59.55859375, -57.453125, -55.34765625, -53.2421875, -51.13671875, -49.03125, -46.92578125, -44.8203125, -42.71484375, -40.609375, -38.50390625, -36.3984375, -34.29296875, -32.1875, -30.08203125, -27.9765625, -25.87109375, -23.765625, -21.66015625, -19.5546875, -17.44921875, -15.34375, -13.23828125, -11.1328125, -9.02734375, -6.921875, -4.81640625, -2.7109375, -0.60546875, 1.5, 3.60546875, 5.7109375, 7.81640625, 9.921875, 12.02734375, 14.1328125, 16.23828125, 18.34375, 20.44921875, 22.5546875, 24.66015625, 26.765625, 28.87109375, 30.9765625, 33.08203125, 35.1875, 37.29296875, 39.3984375, 41.50390625, 43.609375, 45.71484375, 47.8203125, 49.92578125, 52.03125, 54.13671875, 56.2421875, 58.34765625, 60.453125, 62.55859375, 64.6640625, 66.76953125, 68.875]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 3.0, 10.0, 12.0, 6.0, 7.0, 8.0, 15.0, 19.0, 24.0, 21.0, 26.0, 28.0, 25.0, 33.0, 37.0, 35.0, 46.0, 32.0, 47.0, 37.0, 31.0, 45.0, 27.0, 42.0, 39.0, 25.0, 37.0, 23.0, 25.0, 33.0, 25.0, 21.0, 23.0, 24.0, 18.0, 15.0, 9.0, 11.0, 11.0, 8.0, 7.0, 4.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.234375, -30.121826171875, -29.00927734375, -27.896728515625, -26.7841796875, -25.671630859375, -24.55908203125, -23.446533203125, -22.333984375, -21.221435546875, -20.10888671875, -18.996337890625, -17.8837890625, -16.771240234375, -15.65869140625, -14.546142578125, -13.43359375, -12.321044921875, -11.20849609375, -10.095947265625, -8.9833984375, -7.870849609375, -6.75830078125, -5.645751953125, -4.533203125, -3.420654296875, -2.30810546875, -1.195556640625, -0.0830078125, 1.029541015625, 2.14208984375, 3.254638671875, 4.3671875, 5.479736328125, 6.59228515625, 7.704833984375, 8.8173828125, 9.929931640625, 11.04248046875, 12.155029296875, 13.267578125, 14.380126953125, 15.49267578125, 16.605224609375, 17.7177734375, 18.830322265625, 19.94287109375, 21.055419921875, 22.16796875, 23.280517578125, 24.39306640625, 25.505615234375, 26.6181640625, 27.730712890625, 28.84326171875, 29.955810546875, 31.068359375, 32.180908203125, 33.29345703125, 34.406005859375, 35.5185546875, 36.631103515625, 37.74365234375, 38.856201171875, 39.96875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 11.0, 9.0, 19.0, 26.0, 39.0, 85.0, 115.0, 137.0, 258.0, 375.0, 624.0, 910.0, 1559.0, 2451.0, 4222.0, 7204.0, 12406.0, 22037.0, 40388.0, 75333.0, 145667.0, 299121.0, 664903.0, 1376993.0, 814317.0, 358881.0, 172334.0, 87724.0, 46577.0, 25720.0, 14176.0, 8018.0, 4662.0, 2765.0, 1640.0, 957.0, 577.0, 361.0, 241.0, 168.0, 93.0, 61.0, 32.0, 25.0, 20.0, 17.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.3125, -62.2119140625, -60.111328125, -58.0107421875, -55.91015625, -53.8095703125, -51.708984375, -49.6083984375, -47.5078125, -45.4072265625, -43.306640625, -41.2060546875, -39.10546875, -37.0048828125, -34.904296875, -32.8037109375, -30.703125, -28.6025390625, -26.501953125, -24.4013671875, -22.30078125, -20.2001953125, -18.099609375, -15.9990234375, -13.8984375, -11.7978515625, -9.697265625, -7.5966796875, -5.49609375, -3.3955078125, -1.294921875, 0.8056640625, 2.90625, 5.0068359375, 7.107421875, 9.2080078125, 11.30859375, 13.4091796875, 15.509765625, 17.6103515625, 19.7109375, 21.8115234375, 23.912109375, 26.0126953125, 28.11328125, 30.2138671875, 32.314453125, 34.4150390625, 36.515625, 38.6162109375, 40.716796875, 42.8173828125, 44.91796875, 47.0185546875, 49.119140625, 51.2197265625, 53.3203125, 55.4208984375, 57.521484375, 59.6220703125, 61.72265625, 63.8232421875, 65.923828125, 68.0244140625, 70.125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 10.0, 17.0, 16.0, 24.0, 28.0, 41.0, 54.0, 70.0, 85.0, 106.0, 152.0, 165.0, 216.0, 262.0, 321.0, 344.0, 379.0, 329.0, 257.0, 265.0, 195.0, 138.0, 115.0, 102.0, 78.0, 64.0, 48.0, 32.0, 32.0, 25.0, 15.0, 16.0, 12.0, 13.0, 8.0, 6.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.250244140625, -18.51611328125, -17.781982421875, -17.0478515625, -16.313720703125, -15.57958984375, -14.845458984375, -14.111328125, -13.377197265625, -12.64306640625, -11.908935546875, -11.1748046875, -10.440673828125, -9.70654296875, -8.972412109375, -8.23828125, -7.504150390625, -6.77001953125, -6.035888671875, -5.3017578125, -4.567626953125, -3.83349609375, -3.099365234375, -2.365234375, -1.631103515625, -0.89697265625, -0.162841796875, 0.5712890625, 1.305419921875, 2.03955078125, 2.773681640625, 3.5078125, 4.241943359375, 4.97607421875, 5.710205078125, 6.4443359375, 7.178466796875, 7.91259765625, 8.646728515625, 9.380859375, 10.114990234375, 10.84912109375, 11.583251953125, 12.3173828125, 13.051513671875, 13.78564453125, 14.519775390625, 15.25390625, 15.988037109375, 16.72216796875, 17.456298828125, 18.1904296875, 18.924560546875, 19.65869140625, 20.392822265625, 21.126953125, 21.861083984375, 22.59521484375, 23.329345703125, 24.0634765625, 24.797607421875, 25.53173828125, 26.265869140625, 27.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 3.0, 5.0, 6.0, 16.0, 23.0, 32.0, 34.0, 41.0, 53.0, 68.0, 77.0, 87.0, 84.0, 76.0, 63.0, 66.0, 51.0, 44.0, 34.0, 26.0, 19.0, 15.0, 15.0, 14.0, 12.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-70.5233383178711, -68.5509033203125, -66.5784683227539, -64.60603332519531, -62.63359832763672, -60.661163330078125, -58.6887321472168, -56.7162971496582, -54.74386215209961, -52.771427154541016, -50.79899215698242, -48.82655715942383, -46.8541259765625, -44.881690979003906, -42.90925598144531, -40.93682098388672, -38.964385986328125, -36.99195098876953, -35.01951599121094, -33.047080993652344, -31.074647903442383, -29.10221290588379, -27.129779815673828, -25.157344818115234, -23.18490982055664, -21.212474822998047, -19.240039825439453, -17.267606735229492, -15.295171737670898, -13.322736740112305, -11.350302696228027, -9.37786865234375, -7.405429840087891, -5.432995319366455, -3.4605607986450195, -1.488126277923584, 0.48430824279785156, 2.4567432403564453, 4.429177284240723, 6.401611328125, 8.374046325683594, 10.346481323242188, 12.318915367126465, 14.291349411010742, 16.263784408569336, 18.23621940612793, 20.20865249633789, 22.181087493896484, 24.153522491455078, 26.125957489013672, 28.098392486572266, 30.070825576782227, 32.04325866699219, 34.01569366455078, 35.988128662109375, 37.96056365966797, 39.93299865722656, 41.905433654785156, 43.87786865234375, 45.850303649902344, 47.82273864746094, 49.79517364501953, 51.76760482788086, 53.74003982543945, 55.71247482299805]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 3.0, 11.0, 7.0, 7.0, 15.0, 14.0, 15.0, 14.0, 19.0, 19.0, 28.0, 23.0, 38.0, 33.0, 33.0, 35.0, 47.0, 32.0, 40.0, 38.0, 49.0, 34.0, 47.0, 47.0, 31.0, 37.0, 26.0, 32.0, 28.0, 32.0, 19.0, 15.0, 15.0, 19.0, 23.0, 16.0, 16.0, 11.0, 6.0, 4.0, 4.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.359561920166016, -37.024356842041016, -35.68915557861328, -34.35395050048828, -33.01874542236328, -31.68354034423828, -30.348337173461914, -29.013134002685547, -27.677928924560547, -26.342723846435547, -25.00752067565918, -23.672317504882812, -22.337112426757812, -21.001907348632812, -19.666704177856445, -18.331501007080078, -16.996295928955078, -15.661091804504395, -14.325887680053711, -12.990683555603027, -11.655479431152344, -10.32027530670166, -8.985071182250977, -7.649867057800293, -6.314662933349609, -4.979458808898926, -3.644254684448242, -2.3090505599975586, -0.973846435546875, 0.3613576889038086, 1.6965618133544922, 3.031765937805176, 4.366973876953125, 5.702178001403809, 7.037382125854492, 8.372586250305176, 9.70779037475586, 11.042994499206543, 12.378198623657227, 13.71340274810791, 15.048606872558594, 16.383811950683594, 17.71901512145996, 19.054218292236328, 20.389423370361328, 21.724628448486328, 23.059831619262695, 24.395034790039062, 25.730239868164062, 27.065444946289062, 28.40064811706543, 29.735851287841797, 31.071056365966797, 32.4062614440918, 33.74146270751953, 35.07666778564453, 36.41187286376953, 37.74707794189453, 39.08228302001953, 40.417484283447266, 41.752689361572266, 43.087894439697266, 44.423095703125, 45.75830078125, 47.093505859375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 10.0, 8.0, 11.0, 17.0, 18.0, 26.0, 46.0, 53.0, 96.0, 143.0, 181.0, 250.0, 406.0, 637.0, 976.0, 1485.0, 2252.0, 3764.0, 6182.0, 10605.0, 18609.0, 32803.0, 60928.0, 116943.0, 241219.0, 265733.0, 131253.0, 67963.0, 36280.0, 20094.0, 11539.0, 6817.0, 4119.0, 2481.0, 1601.0, 994.0, 625.0, 457.0, 295.0, 188.0, 135.0, 88.0, 74.0, 47.0, 34.0, 18.0, 12.0, 11.0, 13.0, 6.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.375, -41.93310546875, -40.4912109375, -39.04931640625, -37.607421875, -36.16552734375, -34.7236328125, -33.28173828125, -31.83984375, -30.39794921875, -28.9560546875, -27.51416015625, -26.072265625, -24.63037109375, -23.1884765625, -21.74658203125, -20.3046875, -18.86279296875, -17.4208984375, -15.97900390625, -14.537109375, -13.09521484375, -11.6533203125, -10.21142578125, -8.76953125, -7.32763671875, -5.8857421875, -4.44384765625, -3.001953125, -1.56005859375, -0.1181640625, 1.32373046875, 2.765625, 4.20751953125, 5.6494140625, 7.09130859375, 8.533203125, 9.97509765625, 11.4169921875, 12.85888671875, 14.30078125, 15.74267578125, 17.1845703125, 18.62646484375, 20.068359375, 21.51025390625, 22.9521484375, 24.39404296875, 25.8359375, 27.27783203125, 28.7197265625, 30.16162109375, 31.603515625, 33.04541015625, 34.4873046875, 35.92919921875, 37.37109375, 38.81298828125, 40.2548828125, 41.69677734375, 43.138671875, 44.58056640625, 46.0224609375, 47.46435546875, 48.90625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 2.0, 9.0, 10.0, 7.0, 11.0, 11.0, 18.0, 19.0, 19.0, 23.0, 29.0, 26.0, 35.0, 25.0, 50.0, 30.0, 34.0, 47.0, 40.0, 48.0, 52.0, 40.0, 45.0, 38.0, 39.0, 32.0, 23.0, 34.0, 22.0, 25.0, 22.0, 21.0, 21.0, 21.0, 9.0, 14.0, 12.0, 7.0, 5.0, 3.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.1875, -36.87548828125, -35.5634765625, -34.25146484375, -32.939453125, -31.62744140625, -30.3154296875, -29.00341796875, -27.69140625, -26.37939453125, -25.0673828125, -23.75537109375, -22.443359375, -21.13134765625, -19.8193359375, -18.50732421875, -17.1953125, -15.88330078125, -14.5712890625, -13.25927734375, -11.947265625, -10.63525390625, -9.3232421875, -8.01123046875, -6.69921875, -5.38720703125, -4.0751953125, -2.76318359375, -1.451171875, -0.13916015625, 1.1728515625, 2.48486328125, 3.796875, 5.10888671875, 6.4208984375, 7.73291015625, 9.044921875, 10.35693359375, 11.6689453125, 12.98095703125, 14.29296875, 15.60498046875, 16.9169921875, 18.22900390625, 19.541015625, 20.85302734375, 22.1650390625, 23.47705078125, 24.7890625, 26.10107421875, 27.4130859375, 28.72509765625, 30.037109375, 31.34912109375, 32.6611328125, 33.97314453125, 35.28515625, 36.59716796875, 37.9091796875, 39.22119140625, 40.533203125, 41.84521484375, 43.1572265625, 44.46923828125, 45.78125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 8.0, 12.0, 12.0, 24.0, 33.0, 42.0, 48.0, 86.0, 145.0, 179.0, 296.0, 417.0, 632.0, 958.0, 1521.0, 2468.0, 4091.0, 6820.0, 11886.0, 20910.0, 39880.0, 89803.0, 274907.0, 372657.0, 114521.0, 48788.0, 24187.0, 13258.0, 7568.0, 4604.0, 2851.0, 1789.0, 1071.0, 713.0, 448.0, 290.0, 181.0, 131.0, 92.0, 62.0, 52.0, 32.0, 20.0, 11.0, 12.0, 13.0, 8.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-32.375, -31.30029296875, -30.2255859375, -29.15087890625, -28.076171875, -27.00146484375, -25.9267578125, -24.85205078125, -23.77734375, -22.70263671875, -21.6279296875, -20.55322265625, -19.478515625, -18.40380859375, -17.3291015625, -16.25439453125, -15.1796875, -14.10498046875, -13.0302734375, -11.95556640625, -10.880859375, -9.80615234375, -8.7314453125, -7.65673828125, -6.58203125, -5.50732421875, -4.4326171875, -3.35791015625, -2.283203125, -1.20849609375, -0.1337890625, 0.94091796875, 2.015625, 3.09033203125, 4.1650390625, 5.23974609375, 6.314453125, 7.38916015625, 8.4638671875, 9.53857421875, 10.61328125, 11.68798828125, 12.7626953125, 13.83740234375, 14.912109375, 15.98681640625, 17.0615234375, 18.13623046875, 19.2109375, 20.28564453125, 21.3603515625, 22.43505859375, 23.509765625, 24.58447265625, 25.6591796875, 26.73388671875, 27.80859375, 28.88330078125, 29.9580078125, 31.03271484375, 32.107421875, 33.18212890625, 34.2568359375, 35.33154296875, 36.40625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 5.0, 6.0, 6.0, 15.0, 9.0, 17.0, 16.0, 10.0, 19.0, 21.0, 25.0, 22.0, 20.0, 32.0, 34.0, 29.0, 44.0, 41.0, 41.0, 33.0, 41.0, 50.0, 38.0, 46.0, 35.0, 47.0, 35.0, 22.0, 32.0, 29.0, 20.0, 22.0, 21.0, 20.0, 18.0, 10.0, 6.0, 16.0, 4.0, 9.0, 7.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.125, -26.221435546875, -25.31787109375, -24.414306640625, -23.5107421875, -22.607177734375, -21.70361328125, -20.800048828125, -19.896484375, -18.992919921875, -18.08935546875, -17.185791015625, -16.2822265625, -15.378662109375, -14.47509765625, -13.571533203125, -12.66796875, -11.764404296875, -10.86083984375, -9.957275390625, -9.0537109375, -8.150146484375, -7.24658203125, -6.343017578125, -5.439453125, -4.535888671875, -3.63232421875, -2.728759765625, -1.8251953125, -0.921630859375, -0.01806640625, 0.885498046875, 1.7890625, 2.692626953125, 3.59619140625, 4.499755859375, 5.4033203125, 6.306884765625, 7.21044921875, 8.114013671875, 9.017578125, 9.921142578125, 10.82470703125, 11.728271484375, 12.6318359375, 13.535400390625, 14.43896484375, 15.342529296875, 16.24609375, 17.149658203125, 18.05322265625, 18.956787109375, 19.8603515625, 20.763916015625, 21.66748046875, 22.571044921875, 23.474609375, 24.378173828125, 25.28173828125, 26.185302734375, 27.0888671875, 27.992431640625, 28.89599609375, 29.799560546875, 30.703125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 5.0, 10.0, 24.0, 15.0, 44.0, 37.0, 74.0, 74.0, 96.0, 121.0, 186.0, 201.0, 304.0, 456.0, 638.0, 912.0, 1411.0, 2340.0, 4056.0, 7426.0, 16364.0, 46767.0, 264019.0, 587984.0, 70811.0, 22135.0, 9323.0, 4733.0, 2621.0, 1679.0, 1064.0, 729.0, 536.0, 373.0, 276.0, 181.0, 137.0, 88.0, 76.0, 53.0, 46.0, 33.0, 22.0, 16.0, 20.0, 7.0, 6.0, 4.0, 4.0, 7.0, 0.0, 0.0, 6.0, 0.0, 2.0], "bins": [-19.4375, -18.8330078125, -18.228515625, -17.6240234375, -17.01953125, -16.4150390625, -15.810546875, -15.2060546875, -14.6015625, -13.9970703125, -13.392578125, -12.7880859375, -12.18359375, -11.5791015625, -10.974609375, -10.3701171875, -9.765625, -9.1611328125, -8.556640625, -7.9521484375, -7.34765625, -6.7431640625, -6.138671875, -5.5341796875, -4.9296875, -4.3251953125, -3.720703125, -3.1162109375, -2.51171875, -1.9072265625, -1.302734375, -0.6982421875, -0.09375, 0.5107421875, 1.115234375, 1.7197265625, 2.32421875, 2.9287109375, 3.533203125, 4.1376953125, 4.7421875, 5.3466796875, 5.951171875, 6.5556640625, 7.16015625, 7.7646484375, 8.369140625, 8.9736328125, 9.578125, 10.1826171875, 10.787109375, 11.3916015625, 11.99609375, 12.6005859375, 13.205078125, 13.8095703125, 14.4140625, 15.0185546875, 15.623046875, 16.2275390625, 16.83203125, 17.4365234375, 18.041015625, 18.6455078125, 19.25]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 5.0, 4.0, 3.0, 5.0, 9.0, 6.0, 12.0, 12.0, 18.0, 16.0, 24.0, 28.0, 37.0, 26.0, 33.0, 41.0, 61.0, 68.0, 83.0, 79.0, 69.0, 57.0, 53.0, 43.0, 29.0, 35.0, 23.0, 19.0, 20.0, 18.0, 16.0, 16.0, 11.0, 5.0, 6.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002254486083984375, -0.0021804869174957275, -0.00210648775100708, -0.0020324885845184326, -0.001958489418029785, -0.0018844902515411377, -0.0018104910850524902, -0.0017364919185638428, -0.0016624927520751953, -0.0015884935855865479, -0.0015144944190979004, -0.001440495252609253, -0.0013664960861206055, -0.001292496919631958, -0.0012184977531433105, -0.001144498586654663, -0.0010704994201660156, -0.0009965002536773682, -0.0009225010871887207, -0.0008485019207000732, -0.0007745027542114258, -0.0007005035877227783, -0.0006265044212341309, -0.0005525052547454834, -0.00047850608825683594, -0.0004045069217681885, -0.000330507755279541, -0.00025650858879089355, -0.0001825094223022461, -0.00010851025581359863, -3.451108932495117e-05, 3.948807716369629e-05, 0.00011348724365234375, 0.0001874864101409912, 0.00026148557662963867, 0.00033548474311828613, 0.0004094839096069336, 0.00048348307609558105, 0.0005574822425842285, 0.000631481409072876, 0.0007054805755615234, 0.0007794797420501709, 0.0008534789085388184, 0.0009274780750274658, 0.0010014772415161133, 0.0010754764080047607, 0.0011494755744934082, 0.0012234747409820557, 0.0012974739074707031, 0.0013714730739593506, 0.001445472240447998, 0.0015194714069366455, 0.001593470573425293, 0.0016674697399139404, 0.0017414689064025879, 0.0018154680728912354, 0.0018894672393798828, 0.0019634664058685303, 0.0020374655723571777, 0.002111464738845825, 0.0021854639053344727, 0.00225946307182312, 0.0023334622383117676, 0.002407461404800415, 0.0024814605712890625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 1.0, 5.0, 8.0, 10.0, 14.0, 15.0, 26.0, 33.0, 37.0, 62.0, 101.0, 116.0, 165.0, 233.0, 341.0, 470.0, 713.0, 1094.0, 1512.0, 2435.0, 3896.0, 6549.0, 12559.0, 28816.0, 85667.0, 394635.0, 369335.0, 82165.0, 27742.0, 12313.0, 6500.0, 3745.0, 2359.0, 1525.0, 995.0, 698.0, 501.0, 317.0, 267.0, 168.0, 109.0, 91.0, 51.0, 46.0, 31.0, 32.0, 14.0, 13.0, 9.0, 7.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.3125, -26.3701171875, -25.427734375, -24.4853515625, -23.54296875, -22.6005859375, -21.658203125, -20.7158203125, -19.7734375, -18.8310546875, -17.888671875, -16.9462890625, -16.00390625, -15.0615234375, -14.119140625, -13.1767578125, -12.234375, -11.2919921875, -10.349609375, -9.4072265625, -8.46484375, -7.5224609375, -6.580078125, -5.6376953125, -4.6953125, -3.7529296875, -2.810546875, -1.8681640625, -0.92578125, 0.0166015625, 0.958984375, 1.9013671875, 2.84375, 3.7861328125, 4.728515625, 5.6708984375, 6.61328125, 7.5556640625, 8.498046875, 9.4404296875, 10.3828125, 11.3251953125, 12.267578125, 13.2099609375, 14.15234375, 15.0947265625, 16.037109375, 16.9794921875, 17.921875, 18.8642578125, 19.806640625, 20.7490234375, 21.69140625, 22.6337890625, 23.576171875, 24.5185546875, 25.4609375, 26.4033203125, 27.345703125, 28.2880859375, 29.23046875, 30.1728515625, 31.115234375, 32.0576171875, 33.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 4.0, 8.0, 2.0, 1.0, 4.0, 7.0, 8.0, 6.0, 18.0, 21.0, 29.0, 55.0, 86.0, 112.0, 162.0, 140.0, 112.0, 66.0, 43.0, 25.0, 13.0, 19.0, 9.0, 15.0, 4.0, 7.0, 4.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.1953125, -9.91015625, -9.625, -9.33984375, -9.0546875, -8.76953125, -8.484375, -8.19921875, -7.9140625, -7.62890625, -7.34375, -7.05859375, -6.7734375, -6.48828125, -6.203125, -5.91796875, -5.6328125, -5.34765625, -5.0625, -4.77734375, -4.4921875, -4.20703125, -3.921875, -3.63671875, -3.3515625, -3.06640625, -2.78125, -2.49609375, -2.2109375, -1.92578125, -1.640625, -1.35546875, -1.0703125, -0.78515625, -0.5, -0.21484375, 0.0703125, 0.35546875, 0.640625, 0.92578125, 1.2109375, 1.49609375, 1.78125, 2.06640625, 2.3515625, 2.63671875, 2.921875, 3.20703125, 3.4921875, 3.77734375, 4.0625, 4.34765625, 4.6328125, 4.91796875, 5.203125, 5.48828125, 5.7734375, 6.05859375, 6.34375, 6.62890625, 6.9140625, 7.19921875, 7.484375, 7.76953125, 8.0546875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 8.0, 10.0, 23.0, 9.0, 22.0, 37.0, 35.0, 57.0, 56.0, 68.0, 80.0, 71.0, 83.0, 74.0, 70.0, 52.0, 38.0, 38.0, 33.0, 36.0, 12.0, 14.0, 12.0, 18.0, 9.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-61.19804000854492, -59.35976791381836, -57.5214958190918, -55.683223724365234, -53.84495162963867, -52.00667953491211, -50.16840362548828, -48.33013153076172, -46.491859436035156, -44.653587341308594, -42.81531524658203, -40.97704315185547, -39.138771057128906, -37.300498962402344, -35.46222686767578, -33.62395477294922, -31.785682678222656, -29.947410583496094, -28.10913848876953, -26.27086639404297, -24.432594299316406, -22.594322204589844, -20.75604820251465, -18.917776107788086, -17.079504013061523, -15.241231918334961, -13.402959823608398, -11.56468677520752, -9.726414680480957, -7.8881425857543945, -6.049869537353516, -4.211597442626953, -2.373321533203125, -0.5350492000579834, 1.3032231330871582, 3.141495704650879, 4.979767799377441, 6.818039894104004, 8.656312942504883, 10.494585037231445, 12.332857131958008, 14.17112922668457, 16.009401321411133, 17.847675323486328, 19.68594741821289, 21.524219512939453, 23.362491607666016, 25.200763702392578, 27.03903579711914, 28.877307891845703, 30.715579986572266, 32.55385208129883, 34.39212417602539, 36.23039627075195, 38.06867218017578, 39.906944274902344, 41.745216369628906, 43.58348846435547, 45.42176055908203, 47.260032653808594, 49.098304748535156, 50.93657684326172, 52.77484893798828, 54.613121032714844, 56.451393127441406]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 8.0, 9.0, 15.0, 13.0, 16.0, 17.0, 28.0, 21.0, 26.0, 27.0, 32.0, 32.0, 34.0, 43.0, 42.0, 39.0, 36.0, 31.0, 45.0, 48.0, 45.0, 31.0, 33.0, 34.0, 40.0, 33.0, 26.0, 18.0, 17.0, 20.0, 25.0, 17.0, 12.0, 17.0, 16.0, 6.0, 8.0, 7.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.28730392456055, -33.02607727050781, -31.76485252380371, -30.50362777709961, -29.242403030395508, -27.981178283691406, -26.719951629638672, -25.45872688293457, -24.19750213623047, -22.936277389526367, -21.675050735473633, -20.41382598876953, -19.15260124206543, -17.891376495361328, -16.630149841308594, -15.368925094604492, -14.107698440551758, -12.84647274017334, -11.585247993469238, -10.32402229309082, -9.062797546386719, -7.801571846008301, -6.540346145629883, -5.279121398925781, -4.017895698547363, -2.7566704750061035, -1.4954450130462646, -0.23421955108642578, 1.027005672454834, 2.2882308959960938, 3.5494565963745117, 4.810681343078613, 6.071907043457031, 7.333132266998291, 8.59435749053955, 9.855583190917969, 11.11680793762207, 12.378033638000488, 13.639259338378906, 14.900484085083008, 16.16170883178711, 17.42293357849121, 18.684160232543945, 19.945384979248047, 21.20660972595215, 22.46783447265625, 23.729061126708984, 24.990285873413086, 26.25151252746582, 27.512737274169922, 28.773963928222656, 30.035188674926758, 31.29641342163086, 32.557640075683594, 33.81886291503906, 35.0800895690918, 36.34131622314453, 37.602542877197266, 38.863765716552734, 40.12499237060547, 41.3862190246582, 42.64744186401367, 43.908668518066406, 45.169891357421875, 46.43111801147461]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 9.0, 6.0, 19.0, 16.0, 30.0, 44.0, 69.0, 106.0, 151.0, 205.0, 386.0, 568.0, 915.0, 1442.0, 2298.0, 3475.0, 5836.0, 9290.0, 14969.0, 24401.0, 40392.0, 67260.0, 113540.0, 179579.0, 205995.0, 149264.0, 90274.0, 53710.0, 32347.0, 19749.0, 12078.0, 7506.0, 4759.0, 2822.0, 1828.0, 1141.0, 735.0, 448.0, 316.0, 213.0, 115.0, 87.0, 46.0, 30.0, 27.0, 17.0, 10.0, 7.0, 11.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-65.0, -62.986328125, -60.97265625, -58.958984375, -56.9453125, -54.931640625, -52.91796875, -50.904296875, -48.890625, -46.876953125, -44.86328125, -42.849609375, -40.8359375, -38.822265625, -36.80859375, -34.794921875, -32.78125, -30.767578125, -28.75390625, -26.740234375, -24.7265625, -22.712890625, -20.69921875, -18.685546875, -16.671875, -14.658203125, -12.64453125, -10.630859375, -8.6171875, -6.603515625, -4.58984375, -2.576171875, -0.5625, 1.451171875, 3.46484375, 5.478515625, 7.4921875, 9.505859375, 11.51953125, 13.533203125, 15.546875, 17.560546875, 19.57421875, 21.587890625, 23.6015625, 25.615234375, 27.62890625, 29.642578125, 31.65625, 33.669921875, 35.68359375, 37.697265625, 39.7109375, 41.724609375, 43.73828125, 45.751953125, 47.765625, 49.779296875, 51.79296875, 53.806640625, 55.8203125, 57.833984375, 59.84765625, 61.861328125, 63.875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 9.0, 8.0, 9.0, 10.0, 14.0, 26.0, 24.0, 27.0, 31.0, 29.0, 32.0, 28.0, 37.0, 44.0, 32.0, 46.0, 41.0, 45.0, 50.0, 43.0, 46.0, 42.0, 38.0, 32.0, 40.0, 33.0, 29.0, 24.0, 25.0, 15.0, 22.0, 18.0, 15.0, 9.0, 9.0, 5.0, 2.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.109375, -29.963134765625, -28.81689453125, -27.670654296875, -26.5244140625, -25.378173828125, -24.23193359375, -23.085693359375, -21.939453125, -20.793212890625, -19.64697265625, -18.500732421875, -17.3544921875, -16.208251953125, -15.06201171875, -13.915771484375, -12.76953125, -11.623291015625, -10.47705078125, -9.330810546875, -8.1845703125, -7.038330078125, -5.89208984375, -4.745849609375, -3.599609375, -2.453369140625, -1.30712890625, -0.160888671875, 0.9853515625, 2.131591796875, 3.27783203125, 4.424072265625, 5.5703125, 6.716552734375, 7.86279296875, 9.009033203125, 10.1552734375, 11.301513671875, 12.44775390625, 13.593994140625, 14.740234375, 15.886474609375, 17.03271484375, 18.178955078125, 19.3251953125, 20.471435546875, 21.61767578125, 22.763916015625, 23.91015625, 25.056396484375, 26.20263671875, 27.348876953125, 28.4951171875, 29.641357421875, 30.78759765625, 31.933837890625, 33.080078125, 34.226318359375, 35.37255859375, 36.518798828125, 37.6650390625, 38.811279296875, 39.95751953125, 41.103759765625, 42.25]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 13.0, 15.0, 15.0, 31.0, 66.0, 86.0, 102.0, 168.0, 225.0, 346.0, 456.0, 677.0, 1003.0, 1446.0, 2129.0, 3133.0, 4675.0, 7107.0, 10634.0, 16178.0, 25354.0, 40073.0, 64082.0, 100902.0, 150425.0, 183112.0, 152041.0, 102619.0, 65092.0, 40885.0, 26107.0, 16479.0, 10773.0, 7199.0, 4723.0, 3252.0, 2133.0, 1478.0, 1053.0, 644.0, 494.0, 382.0, 239.0, 165.0, 120.0, 71.0, 52.0, 42.0, 20.0, 14.0, 6.0, 2.0, 6.0, 4.0, 3.0, 0.0, 1.0], "bins": [-51.71875, -50.12841796875, -48.5380859375, -46.94775390625, -45.357421875, -43.76708984375, -42.1767578125, -40.58642578125, -38.99609375, -37.40576171875, -35.8154296875, -34.22509765625, -32.634765625, -31.04443359375, -29.4541015625, -27.86376953125, -26.2734375, -24.68310546875, -23.0927734375, -21.50244140625, -19.912109375, -18.32177734375, -16.7314453125, -15.14111328125, -13.55078125, -11.96044921875, -10.3701171875, -8.77978515625, -7.189453125, -5.59912109375, -4.0087890625, -2.41845703125, -0.828125, 0.76220703125, 2.3525390625, 3.94287109375, 5.533203125, 7.12353515625, 8.7138671875, 10.30419921875, 11.89453125, 13.48486328125, 15.0751953125, 16.66552734375, 18.255859375, 19.84619140625, 21.4365234375, 23.02685546875, 24.6171875, 26.20751953125, 27.7978515625, 29.38818359375, 30.978515625, 32.56884765625, 34.1591796875, 35.74951171875, 37.33984375, 38.93017578125, 40.5205078125, 42.11083984375, 43.701171875, 45.29150390625, 46.8818359375, 48.47216796875, 50.0625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 5.0, 5.0, 7.0, 9.0, 13.0, 9.0, 13.0, 23.0, 20.0, 27.0, 27.0, 29.0, 27.0, 35.0, 26.0, 44.0, 37.0, 27.0, 35.0, 25.0, 44.0, 36.0, 52.0, 29.0, 37.0, 29.0, 22.0, 41.0, 30.0, 37.0, 17.0, 16.0, 20.0, 19.0, 26.0, 16.0, 10.0, 7.0, 9.0, 6.0, 8.0, 8.0, 9.0, 6.0, 3.0, 2.0, 7.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-22.65625, -21.94482421875, -21.2333984375, -20.52197265625, -19.810546875, -19.09912109375, -18.3876953125, -17.67626953125, -16.96484375, -16.25341796875, -15.5419921875, -14.83056640625, -14.119140625, -13.40771484375, -12.6962890625, -11.98486328125, -11.2734375, -10.56201171875, -9.8505859375, -9.13916015625, -8.427734375, -7.71630859375, -7.0048828125, -6.29345703125, -5.58203125, -4.87060546875, -4.1591796875, -3.44775390625, -2.736328125, -2.02490234375, -1.3134765625, -0.60205078125, 0.109375, 0.82080078125, 1.5322265625, 2.24365234375, 2.955078125, 3.66650390625, 4.3779296875, 5.08935546875, 5.80078125, 6.51220703125, 7.2236328125, 7.93505859375, 8.646484375, 9.35791015625, 10.0693359375, 10.78076171875, 11.4921875, 12.20361328125, 12.9150390625, 13.62646484375, 14.337890625, 15.04931640625, 15.7607421875, 16.47216796875, 17.18359375, 17.89501953125, 18.6064453125, 19.31787109375, 20.029296875, 20.74072265625, 21.4521484375, 22.16357421875, 22.875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 6.0, 7.0, 8.0, 8.0, 11.0, 19.0, 22.0, 30.0, 51.0, 61.0, 64.0, 121.0, 185.0, 214.0, 319.0, 446.0, 677.0, 909.0, 1388.0, 2012.0, 3498.0, 7112.0, 19920.0, 83834.0, 714691.0, 161998.0, 29808.0, 9436.0, 4224.0, 2445.0, 1511.0, 1068.0, 705.0, 505.0, 352.0, 253.0, 202.0, 124.0, 82.0, 63.0, 42.0, 37.0, 22.0, 22.0, 23.0, 6.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-154.375, -148.98828125, -143.6015625, -138.21484375, -132.828125, -127.44140625, -122.0546875, -116.66796875, -111.28125, -105.89453125, -100.5078125, -95.12109375, -89.734375, -84.34765625, -78.9609375, -73.57421875, -68.1875, -62.80078125, -57.4140625, -52.02734375, -46.640625, -41.25390625, -35.8671875, -30.48046875, -25.09375, -19.70703125, -14.3203125, -8.93359375, -3.546875, 1.83984375, 7.2265625, 12.61328125, 18.0, 23.38671875, 28.7734375, 34.16015625, 39.546875, 44.93359375, 50.3203125, 55.70703125, 61.09375, 66.48046875, 71.8671875, 77.25390625, 82.640625, 88.02734375, 93.4140625, 98.80078125, 104.1875, 109.57421875, 114.9609375, 120.34765625, 125.734375, 131.12109375, 136.5078125, 141.89453125, 147.28125, 152.66796875, 158.0546875, 163.44140625, 168.828125, 174.21484375, 179.6015625, 184.98828125, 190.375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 1.0, 13.0, 10.0, 26.0, 25.0, 45.0, 76.0, 138.0, 203.0, 177.0, 129.0, 64.0, 39.0, 21.0, 8.0, 2.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0098876953125, -0.00963902473449707, -0.00939035415649414, -0.009141683578491211, -0.008893013000488281, -0.008644342422485352, -0.008395671844482422, -0.008147001266479492, -0.007898330688476562, -0.007649660110473633, -0.007400989532470703, -0.0071523189544677734, -0.006903648376464844, -0.006654977798461914, -0.006406307220458984, -0.006157636642456055, -0.005908966064453125, -0.005660295486450195, -0.005411624908447266, -0.005162954330444336, -0.004914283752441406, -0.0046656131744384766, -0.004416942596435547, -0.004168272018432617, -0.0039196014404296875, -0.003670930862426758, -0.003422260284423828, -0.0031735897064208984, -0.0029249191284179688, -0.002676248550415039, -0.0024275779724121094, -0.0021789073944091797, -0.00193023681640625, -0.0016815662384033203, -0.0014328956604003906, -0.001184225082397461, -0.0009355545043945312, -0.0006868839263916016, -0.0004382133483886719, -0.0001895427703857422, 5.91278076171875e-05, 0.0003077983856201172, 0.0005564689636230469, 0.0008051395416259766, 0.0010538101196289062, 0.001302480697631836, 0.0015511512756347656, 0.0017998218536376953, 0.002048492431640625, 0.0022971630096435547, 0.0025458335876464844, 0.002794504165649414, 0.0030431747436523438, 0.0032918453216552734, 0.003540515899658203, 0.003789186477661133, 0.0040378570556640625, 0.004286527633666992, 0.004535198211669922, 0.0047838687896728516, 0.005032539367675781, 0.005281209945678711, 0.005529880523681641, 0.00577855110168457, 0.0060272216796875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 4.0, 9.0, 8.0, 22.0, 17.0, 35.0, 38.0, 55.0, 81.0, 122.0, 188.0, 259.0, 335.0, 496.0, 759.0, 1104.0, 1807.0, 2908.0, 5771.0, 15587.0, 82554.0, 759312.0, 139815.0, 21055.0, 7044.0, 3419.0, 1916.0, 1191.0, 807.0, 540.0, 365.0, 259.0, 193.0, 121.0, 85.0, 70.0, 54.0, 51.0, 21.0, 19.0, 11.0, 11.0, 12.0, 6.0, 6.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-184.0, -178.357421875, -172.71484375, -167.072265625, -161.4296875, -155.787109375, -150.14453125, -144.501953125, -138.859375, -133.216796875, -127.57421875, -121.931640625, -116.2890625, -110.646484375, -105.00390625, -99.361328125, -93.71875, -88.076171875, -82.43359375, -76.791015625, -71.1484375, -65.505859375, -59.86328125, -54.220703125, -48.578125, -42.935546875, -37.29296875, -31.650390625, -26.0078125, -20.365234375, -14.72265625, -9.080078125, -3.4375, 2.205078125, 7.84765625, 13.490234375, 19.1328125, 24.775390625, 30.41796875, 36.060546875, 41.703125, 47.345703125, 52.98828125, 58.630859375, 64.2734375, 69.916015625, 75.55859375, 81.201171875, 86.84375, 92.486328125, 98.12890625, 103.771484375, 109.4140625, 115.056640625, 120.69921875, 126.341796875, 131.984375, 137.626953125, 143.26953125, 148.912109375, 154.5546875, 160.197265625, 165.83984375, 171.482421875, 177.125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 11.0, 25.0, 31.0, 49.0, 76.0, 121.0, 160.0, 153.0, 132.0, 97.0, 50.0, 19.0, 17.0, 11.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-53.78125, -52.47412109375, -51.1669921875, -49.85986328125, -48.552734375, -47.24560546875, -45.9384765625, -44.63134765625, -43.32421875, -42.01708984375, -40.7099609375, -39.40283203125, -38.095703125, -36.78857421875, -35.4814453125, -34.17431640625, -32.8671875, -31.56005859375, -30.2529296875, -28.94580078125, -27.638671875, -26.33154296875, -25.0244140625, -23.71728515625, -22.41015625, -21.10302734375, -19.7958984375, -18.48876953125, -17.181640625, -15.87451171875, -14.5673828125, -13.26025390625, -11.953125, -10.64599609375, -9.3388671875, -8.03173828125, -6.724609375, -5.41748046875, -4.1103515625, -2.80322265625, -1.49609375, -0.18896484375, 1.1181640625, 2.42529296875, 3.732421875, 5.03955078125, 6.3466796875, 7.65380859375, 8.9609375, 10.26806640625, 11.5751953125, 12.88232421875, 14.189453125, 15.49658203125, 16.8037109375, 18.11083984375, 19.41796875, 20.72509765625, 22.0322265625, 23.33935546875, 24.646484375, 25.95361328125, 27.2607421875, 28.56787109375, 29.875]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 13.0, 17.0, 24.0, 34.0, 53.0, 50.0, 74.0, 84.0, 98.0, 82.0, 66.0, 68.0, 62.0, 44.0, 29.0, 30.0, 26.0, 22.0, 18.0, 13.0, 15.0, 12.0, 7.0, 9.0, 10.0, 3.0, 8.0, 2.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.40274429321289, -46.63463592529297, -44.86652374267578, -43.09841537475586, -41.33030700683594, -39.56219482421875, -37.79408645629883, -36.025978088378906, -34.25786590576172, -32.4897575378418, -30.721647262573242, -28.953536987304688, -27.185428619384766, -25.41731834411621, -23.649208068847656, -21.881099700927734, -20.112991333007812, -18.344881057739258, -16.576772689819336, -14.808662414550781, -13.040553092956543, -11.272443771362305, -9.50433349609375, -7.736224174499512, -5.968114852905273, -4.200005531311035, -2.4318957328796387, -0.6637859344482422, 1.104323387145996, 2.8724327087402344, 4.640542984008789, 6.408652305603027, 8.176765441894531, 9.94487476348877, 11.712984085083008, 13.481094360351562, 15.2492036819458, 17.01731300354004, 18.785423278808594, 20.553531646728516, 22.32164192199707, 24.089752197265625, 25.857860565185547, 27.6259708404541, 29.394081115722656, 31.162189483642578, 32.9302978515625, 34.69841003417969, 36.46651840209961, 38.23462677001953, 40.00273895263672, 41.77084732055664, 43.53895568847656, 45.30706787109375, 47.07517623901367, 48.843284606933594, 50.61139678955078, 52.3795051574707, 54.14761734008789, 55.91572570800781, 57.683834075927734, 59.451942443847656, 61.220054626464844, 62.988162994384766, 64.75627136230469]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 5.0, 11.0, 8.0, 12.0, 14.0, 18.0, 15.0, 14.0, 23.0, 26.0, 21.0, 20.0, 17.0, 31.0, 29.0, 32.0, 45.0, 41.0, 38.0, 52.0, 37.0, 36.0, 38.0, 41.0, 41.0, 32.0, 35.0, 38.0, 33.0, 27.0, 24.0, 19.0, 19.0, 15.0, 13.0, 9.0, 13.0, 11.0, 9.0, 8.0, 13.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.464149475097656, -38.22455978393555, -36.98496627807617, -35.74537658691406, -34.50578308105469, -33.26619338989258, -32.0265998840332, -30.787010192871094, -29.54741859436035, -28.30782699584961, -27.068235397338867, -25.828643798828125, -24.589054107666016, -23.34946060180664, -22.10987091064453, -20.87027931213379, -19.630687713623047, -18.391096115112305, -17.151504516601562, -15.911913871765137, -14.672322273254395, -13.432730674743652, -12.193140029907227, -10.953548431396484, -9.713956832885742, -8.474365234375, -7.234774112701416, -5.995182991027832, -4.75559139251709, -3.5159997940063477, -2.2764086723327637, -1.0368175506591797, 0.20277023315429688, 1.44236159324646, 2.681952953338623, 3.921544313430786, 5.161135673522949, 6.400727272033691, 7.640318393707275, 8.87990951538086, 10.119501113891602, 11.359092712402344, 12.598684310913086, 13.838274955749512, 15.077866554260254, 16.317459106445312, 17.557048797607422, 18.796640396118164, 20.036231994628906, 21.27582359313965, 22.51541519165039, 23.755006790161133, 24.994598388671875, 26.234188079833984, 27.473779678344727, 28.71337127685547, 29.95296287536621, 31.192554473876953, 32.43214416503906, 33.67173767089844, 34.91132736206055, 36.15092086791992, 37.39051055908203, 38.630104064941406, 39.869693756103516]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 5.0, 18.0, 24.0, 34.0, 54.0, 63.0, 85.0, 134.0, 183.0, 294.0, 397.0, 572.0, 813.0, 1188.0, 1800.0, 2614.0, 3916.0, 5877.0, 8839.0, 13554.0, 20945.0, 33105.0, 53492.0, 90874.0, 164694.0, 362523.0, 978054.0, 1334840.0, 581553.0, 229708.0, 118127.0, 68003.0, 41593.0, 26108.0, 16619.0, 10855.0, 7174.0, 5058.0, 3233.0, 2277.0, 1602.0, 1043.0, 723.0, 515.0, 319.0, 257.0, 177.0, 121.0, 80.0, 39.0, 39.0, 29.0, 15.0, 12.0, 6.0, 10.0, 4.0, 2.0], "bins": [-41.03125, -39.796875, -38.5625, -37.328125, -36.09375, -34.859375, -33.625, -32.390625, -31.15625, -29.921875, -28.6875, -27.453125, -26.21875, -24.984375, -23.75, -22.515625, -21.28125, -20.046875, -18.8125, -17.578125, -16.34375, -15.109375, -13.875, -12.640625, -11.40625, -10.171875, -8.9375, -7.703125, -6.46875, -5.234375, -4.0, -2.765625, -1.53125, -0.296875, 0.9375, 2.171875, 3.40625, 4.640625, 5.875, 7.109375, 8.34375, 9.578125, 10.8125, 12.046875, 13.28125, 14.515625, 15.75, 16.984375, 18.21875, 19.453125, 20.6875, 21.921875, 23.15625, 24.390625, 25.625, 26.859375, 28.09375, 29.328125, 30.5625, 31.796875, 33.03125, 34.265625, 35.5, 36.734375, 37.96875]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 15.0, 10.0, 8.0, 11.0, 16.0, 15.0, 22.0, 32.0, 24.0, 26.0, 37.0, 24.0, 39.0, 42.0, 32.0, 39.0, 41.0, 33.0, 44.0, 47.0, 37.0, 49.0, 32.0, 33.0, 41.0, 29.0, 33.0, 26.0, 19.0, 14.0, 14.0, 13.0, 10.0, 7.0, 20.0, 9.0, 14.0, 4.0, 5.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.671875, -20.023193359375, -19.37451171875, -18.725830078125, -18.0771484375, -17.428466796875, -16.77978515625, -16.131103515625, -15.482421875, -14.833740234375, -14.18505859375, -13.536376953125, -12.8876953125, -12.239013671875, -11.59033203125, -10.941650390625, -10.29296875, -9.644287109375, -8.99560546875, -8.346923828125, -7.6982421875, -7.049560546875, -6.40087890625, -5.752197265625, -5.103515625, -4.454833984375, -3.80615234375, -3.157470703125, -2.5087890625, -1.860107421875, -1.21142578125, -0.562744140625, 0.0859375, 0.734619140625, 1.38330078125, 2.031982421875, 2.6806640625, 3.329345703125, 3.97802734375, 4.626708984375, 5.275390625, 5.924072265625, 6.57275390625, 7.221435546875, 7.8701171875, 8.518798828125, 9.16748046875, 9.816162109375, 10.46484375, 11.113525390625, 11.76220703125, 12.410888671875, 13.0595703125, 13.708251953125, 14.35693359375, 15.005615234375, 15.654296875, 16.302978515625, 16.95166015625, 17.600341796875, 18.2490234375, 18.897705078125, 19.54638671875, 20.195068359375, 20.84375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 13.0, 12.0, 16.0, 37.0, 61.0, 62.0, 90.0, 152.0, 195.0, 274.0, 395.0, 525.0, 773.0, 1031.0, 1634.0, 2333.0, 3585.0, 5466.0, 8249.0, 13484.0, 22242.0, 37916.0, 68119.0, 125840.0, 248477.0, 527236.0, 1180005.0, 1020498.0, 448306.0, 216098.0, 110989.0, 60451.0, 34188.0, 20325.0, 12254.0, 7716.0, 5038.0, 3176.0, 2186.0, 1474.0, 974.0, 725.0, 499.0, 361.0, 252.0, 175.0, 109.0, 91.0, 64.0, 32.0, 40.0, 20.0, 13.0, 5.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.703125, -30.642822265625, -29.58251953125, -28.522216796875, -27.4619140625, -26.401611328125, -25.34130859375, -24.281005859375, -23.220703125, -22.160400390625, -21.10009765625, -20.039794921875, -18.9794921875, -17.919189453125, -16.85888671875, -15.798583984375, -14.73828125, -13.677978515625, -12.61767578125, -11.557373046875, -10.4970703125, -9.436767578125, -8.37646484375, -7.316162109375, -6.255859375, -5.195556640625, -4.13525390625, -3.074951171875, -2.0146484375, -0.954345703125, 0.10595703125, 1.166259765625, 2.2265625, 3.286865234375, 4.34716796875, 5.407470703125, 6.4677734375, 7.528076171875, 8.58837890625, 9.648681640625, 10.708984375, 11.769287109375, 12.82958984375, 13.889892578125, 14.9501953125, 16.010498046875, 17.07080078125, 18.131103515625, 19.19140625, 20.251708984375, 21.31201171875, 22.372314453125, 23.4326171875, 24.492919921875, 25.55322265625, 26.613525390625, 27.673828125, 28.734130859375, 29.79443359375, 30.854736328125, 31.9150390625, 32.975341796875, 34.03564453125, 35.095947265625, 36.15625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 7.0, 12.0, 15.0, 11.0, 16.0, 24.0, 19.0, 42.0, 41.0, 46.0, 71.0, 72.0, 80.0, 94.0, 115.0, 155.0, 167.0, 197.0, 230.0, 276.0, 283.0, 305.0, 269.0, 236.0, 212.0, 175.0, 170.0, 118.0, 99.0, 88.0, 71.0, 65.0, 48.0, 36.0, 29.0, 33.0, 17.0, 23.0, 20.0, 16.0, 12.0, 9.0, 7.0, 7.0, 5.0, 2.0, 2.0, 4.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0], "bins": [-9.6015625, -9.2852783203125, -8.968994140625, -8.6527099609375, -8.33642578125, -8.0201416015625, -7.703857421875, -7.3875732421875, -7.0712890625, -6.7550048828125, -6.438720703125, -6.1224365234375, -5.80615234375, -5.4898681640625, -5.173583984375, -4.8572998046875, -4.541015625, -4.2247314453125, -3.908447265625, -3.5921630859375, -3.27587890625, -2.9595947265625, -2.643310546875, -2.3270263671875, -2.0107421875, -1.6944580078125, -1.378173828125, -1.0618896484375, -0.74560546875, -0.4293212890625, -0.113037109375, 0.2032470703125, 0.51953125, 0.8358154296875, 1.152099609375, 1.4683837890625, 1.78466796875, 2.1009521484375, 2.417236328125, 2.7335205078125, 3.0498046875, 3.3660888671875, 3.682373046875, 3.9986572265625, 4.31494140625, 4.6312255859375, 4.947509765625, 5.2637939453125, 5.580078125, 5.8963623046875, 6.212646484375, 6.5289306640625, 6.84521484375, 7.1614990234375, 7.477783203125, 7.7940673828125, 8.1103515625, 8.4266357421875, 8.742919921875, 9.0592041015625, 9.37548828125, 9.6917724609375, 10.008056640625, 10.3243408203125, 10.640625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 15.0, 17.0, 26.0, 23.0, 33.0, 26.0, 48.0, 83.0, 89.0, 99.0, 95.0, 83.0, 84.0, 62.0, 60.0, 33.0, 25.0, 14.0, 13.0, 13.0, 15.0, 5.0, 7.0, 3.0, 5.0, 2.0, 3.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.58049964904785, -28.358970642089844, -27.137439727783203, -25.915910720825195, -24.694381713867188, -23.472850799560547, -22.25132179260254, -21.02979278564453, -19.80826187133789, -18.586732864379883, -17.365201950073242, -16.143672943115234, -14.92214298248291, -13.700613021850586, -12.479084014892578, -11.257554054260254, -10.03602409362793, -8.814494132995605, -7.5929646492004395, -6.371435165405273, -5.149905204772949, -3.928375244140625, -2.706845760345459, -1.485316276550293, -0.26378631591796875, 0.9577434062957764, 2.1792731285095215, 3.4008028507232666, 4.622332572937012, 5.843862533569336, 7.065392017364502, 8.286921501159668, 9.508453369140625, 10.72998332977295, 11.951513290405273, 13.173042297363281, 14.394572257995605, 15.61610221862793, 16.837631225585938, 18.059162139892578, 19.280691146850586, 20.502220153808594, 21.723751068115234, 22.945280075073242, 24.16680908203125, 25.38833999633789, 26.6098690032959, 27.831398010253906, 29.052928924560547, 30.274457931518555, 31.495988845825195, 32.7175178527832, 33.939048767089844, 35.16057586669922, 36.38210678100586, 37.6036376953125, 38.825164794921875, 40.046695709228516, 41.26822280883789, 42.48975372314453, 43.71128463745117, 44.93281555175781, 46.15434265136719, 47.37587356567383, 48.59740447998047]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 3.0, 4.0, 8.0, 4.0, 7.0, 5.0, 13.0, 7.0, 8.0, 15.0, 20.0, 25.0, 32.0, 26.0, 21.0, 30.0, 20.0, 31.0, 30.0, 37.0, 32.0, 44.0, 38.0, 44.0, 36.0, 43.0, 46.0, 40.0, 29.0, 40.0, 35.0, 30.0, 23.0, 23.0, 19.0, 23.0, 13.0, 18.0, 16.0, 15.0, 5.0, 9.0, 11.0, 7.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.365324020385742, -21.677663803100586, -20.99000358581543, -20.30234146118164, -19.614681243896484, -18.927021026611328, -18.239360809326172, -17.551700592041016, -16.864038467407227, -16.17637825012207, -15.488717079162598, -14.801056861877441, -14.113395690917969, -13.425735473632812, -12.738075256347656, -12.050414085388184, -11.362753868103027, -10.675093650817871, -9.987432479858398, -9.299772262573242, -8.61211109161377, -7.924450874328613, -7.236790180206299, -6.549129486083984, -5.86146879196167, -5.1738080978393555, -4.486147403717041, -3.7984869480133057, -3.110826253890991, -2.4231655597686768, -1.7355051040649414, -1.047844409942627, -0.3601837158203125, 0.3274769186973572, 1.0151375532150269, 1.7027981281280518, 2.390458822250366, 3.0781195163726807, 3.765779972076416, 4.4534406661987305, 5.141101360321045, 5.828762054443359, 6.516422748565674, 7.204083442687988, 7.8917436599731445, 8.579404830932617, 9.267065048217773, 9.95472526550293, 10.642386436462402, 11.330046653747559, 12.017707824707031, 12.705368041992188, 13.39302921295166, 14.080689430236816, 14.768350601196289, 15.456010818481445, 16.1436710357666, 16.831331253051758, 17.518991470336914, 18.206653594970703, 18.89431381225586, 19.581974029541016, 20.269634246826172, 20.957294464111328, 21.644956588745117]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 7.0, 9.0, 15.0, 14.0, 29.0, 37.0, 64.0, 91.0, 144.0, 206.0, 301.0, 439.0, 681.0, 1088.0, 1755.0, 2856.0, 4484.0, 7641.0, 12877.0, 22133.0, 39563.0, 72069.0, 140838.0, 279679.0, 221087.0, 107395.0, 56871.0, 31140.0, 18261.0, 10266.0, 6266.0, 3852.0, 2327.0, 1499.0, 885.0, 549.0, 394.0, 234.0, 168.0, 128.0, 79.0, 55.0, 25.0, 16.0, 16.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-23.859375, -23.132080078125, -22.40478515625, -21.677490234375, -20.9501953125, -20.222900390625, -19.49560546875, -18.768310546875, -18.041015625, -17.313720703125, -16.58642578125, -15.859130859375, -15.1318359375, -14.404541015625, -13.67724609375, -12.949951171875, -12.22265625, -11.495361328125, -10.76806640625, -10.040771484375, -9.3134765625, -8.586181640625, -7.85888671875, -7.131591796875, -6.404296875, -5.677001953125, -4.94970703125, -4.222412109375, -3.4951171875, -2.767822265625, -2.04052734375, -1.313232421875, -0.5859375, 0.141357421875, 0.86865234375, 1.595947265625, 2.3232421875, 3.050537109375, 3.77783203125, 4.505126953125, 5.232421875, 5.959716796875, 6.68701171875, 7.414306640625, 8.1416015625, 8.868896484375, 9.59619140625, 10.323486328125, 11.05078125, 11.778076171875, 12.50537109375, 13.232666015625, 13.9599609375, 14.687255859375, 15.41455078125, 16.141845703125, 16.869140625, 17.596435546875, 18.32373046875, 19.051025390625, 19.7783203125, 20.505615234375, 21.23291015625, 21.960205078125, 22.6875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 12.0, 10.0, 9.0, 14.0, 18.0, 23.0, 20.0, 23.0, 28.0, 24.0, 31.0, 37.0, 38.0, 39.0, 31.0, 52.0, 47.0, 47.0, 30.0, 52.0, 41.0, 35.0, 40.0, 35.0, 35.0, 30.0, 34.0, 35.0, 17.0, 12.0, 12.0, 12.0, 13.0, 10.0, 8.0, 6.0, 8.0, 5.0, 5.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.0, -22.29052734375, -21.5810546875, -20.87158203125, -20.162109375, -19.45263671875, -18.7431640625, -18.03369140625, -17.32421875, -16.61474609375, -15.9052734375, -15.19580078125, -14.486328125, -13.77685546875, -13.0673828125, -12.35791015625, -11.6484375, -10.93896484375, -10.2294921875, -9.52001953125, -8.810546875, -8.10107421875, -7.3916015625, -6.68212890625, -5.97265625, -5.26318359375, -4.5537109375, -3.84423828125, -3.134765625, -2.42529296875, -1.7158203125, -1.00634765625, -0.296875, 0.41259765625, 1.1220703125, 1.83154296875, 2.541015625, 3.25048828125, 3.9599609375, 4.66943359375, 5.37890625, 6.08837890625, 6.7978515625, 7.50732421875, 8.216796875, 8.92626953125, 9.6357421875, 10.34521484375, 11.0546875, 11.76416015625, 12.4736328125, 13.18310546875, 13.892578125, 14.60205078125, 15.3115234375, 16.02099609375, 16.73046875, 17.43994140625, 18.1494140625, 18.85888671875, 19.568359375, 20.27783203125, 20.9873046875, 21.69677734375, 22.40625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 9.0, 10.0, 19.0, 25.0, 26.0, 41.0, 55.0, 88.0, 138.0, 158.0, 284.0, 436.0, 716.0, 1125.0, 1926.0, 3354.0, 5479.0, 9631.0, 17664.0, 35135.0, 81167.0, 266413.0, 413254.0, 115117.0, 45899.0, 21867.0, 11617.0, 6848.0, 3879.0, 2386.0, 1405.0, 897.0, 499.0, 301.0, 234.0, 121.0, 98.0, 55.0, 47.0, 48.0, 29.0, 11.0, 14.0, 9.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.4375, -21.69384765625, -20.9501953125, -20.20654296875, -19.462890625, -18.71923828125, -17.9755859375, -17.23193359375, -16.48828125, -15.74462890625, -15.0009765625, -14.25732421875, -13.513671875, -12.77001953125, -12.0263671875, -11.28271484375, -10.5390625, -9.79541015625, -9.0517578125, -8.30810546875, -7.564453125, -6.82080078125, -6.0771484375, -5.33349609375, -4.58984375, -3.84619140625, -3.1025390625, -2.35888671875, -1.615234375, -0.87158203125, -0.1279296875, 0.61572265625, 1.359375, 2.10302734375, 2.8466796875, 3.59033203125, 4.333984375, 5.07763671875, 5.8212890625, 6.56494140625, 7.30859375, 8.05224609375, 8.7958984375, 9.53955078125, 10.283203125, 11.02685546875, 11.7705078125, 12.51416015625, 13.2578125, 14.00146484375, 14.7451171875, 15.48876953125, 16.232421875, 16.97607421875, 17.7197265625, 18.46337890625, 19.20703125, 19.95068359375, 20.6943359375, 21.43798828125, 22.181640625, 22.92529296875, 23.6689453125, 24.41259765625, 25.15625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 7.0, 5.0, 4.0, 8.0, 12.0, 17.0, 14.0, 19.0, 20.0, 31.0, 30.0, 22.0, 43.0, 26.0, 37.0, 35.0, 40.0, 30.0, 47.0, 38.0, 41.0, 47.0, 57.0, 37.0, 40.0, 38.0, 31.0, 32.0, 30.0, 29.0, 17.0, 17.0, 26.0, 19.0, 14.0, 12.0, 10.0, 5.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.53125, -15.036865234375, -14.54248046875, -14.048095703125, -13.5537109375, -13.059326171875, -12.56494140625, -12.070556640625, -11.576171875, -11.081787109375, -10.58740234375, -10.093017578125, -9.5986328125, -9.104248046875, -8.60986328125, -8.115478515625, -7.62109375, -7.126708984375, -6.63232421875, -6.137939453125, -5.6435546875, -5.149169921875, -4.65478515625, -4.160400390625, -3.666015625, -3.171630859375, -2.67724609375, -2.182861328125, -1.6884765625, -1.194091796875, -0.69970703125, -0.205322265625, 0.2890625, 0.783447265625, 1.27783203125, 1.772216796875, 2.2666015625, 2.760986328125, 3.25537109375, 3.749755859375, 4.244140625, 4.738525390625, 5.23291015625, 5.727294921875, 6.2216796875, 6.716064453125, 7.21044921875, 7.704833984375, 8.19921875, 8.693603515625, 9.18798828125, 9.682373046875, 10.1767578125, 10.671142578125, 11.16552734375, 11.659912109375, 12.154296875, 12.648681640625, 13.14306640625, 13.637451171875, 14.1318359375, 14.626220703125, 15.12060546875, 15.614990234375, 16.109375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 8.0, 15.0, 10.0, 20.0, 25.0, 35.0, 35.0, 56.0, 67.0, 86.0, 95.0, 142.0, 197.0, 320.0, 493.0, 820.0, 1231.0, 2487.0, 5169.0, 12011.0, 32526.0, 114763.0, 620446.0, 184428.0, 43908.0, 15435.0, 6592.0, 2893.0, 1616.0, 849.0, 535.0, 331.0, 230.0, 175.0, 110.0, 93.0, 74.0, 43.0, 50.0, 26.0, 33.0, 18.0, 14.0, 10.0, 3.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-5.3046875, -5.13702392578125, -4.9693603515625, -4.80169677734375, -4.634033203125, -4.46636962890625, -4.2987060546875, -4.13104248046875, -3.96337890625, -3.79571533203125, -3.6280517578125, -3.46038818359375, -3.292724609375, -3.12506103515625, -2.9573974609375, -2.78973388671875, -2.6220703125, -2.45440673828125, -2.2867431640625, -2.11907958984375, -1.951416015625, -1.78375244140625, -1.6160888671875, -1.44842529296875, -1.28076171875, -1.11309814453125, -0.9454345703125, -0.77777099609375, -0.610107421875, -0.44244384765625, -0.2747802734375, -0.10711669921875, 0.060546875, 0.22821044921875, 0.3958740234375, 0.56353759765625, 0.731201171875, 0.89886474609375, 1.0665283203125, 1.23419189453125, 1.40185546875, 1.56951904296875, 1.7371826171875, 1.90484619140625, 2.072509765625, 2.24017333984375, 2.4078369140625, 2.57550048828125, 2.7431640625, 2.91082763671875, 3.0784912109375, 3.24615478515625, 3.413818359375, 3.58148193359375, 3.7491455078125, 3.91680908203125, 4.08447265625, 4.25213623046875, 4.4197998046875, 4.58746337890625, 4.755126953125, 4.92279052734375, 5.0904541015625, 5.25811767578125, 5.42578125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 10.0, 4.0, 5.0, 10.0, 15.0, 17.0, 22.0, 31.0, 34.0, 36.0, 35.0, 55.0, 49.0, 76.0, 75.0, 67.0, 75.0, 52.0, 37.0, 46.0, 42.0, 30.0, 30.0, 28.0, 18.0, 8.0, 15.0, 12.0, 13.0, 11.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00060272216796875, -0.0005806758999824524, -0.0005586296319961548, -0.0005365833640098572, -0.0005145370960235596, -0.000492490828037262, -0.00047044456005096436, -0.00044839829206466675, -0.00042635202407836914, -0.00040430575609207153, -0.0003822594881057739, -0.0003602132201194763, -0.0003381669521331787, -0.0003161206841468811, -0.0002940744161605835, -0.0002720281481742859, -0.0002499818801879883, -0.00022793561220169067, -0.00020588934421539307, -0.00018384307622909546, -0.00016179680824279785, -0.00013975054025650024, -0.00011770427227020264, -9.565800428390503e-05, -7.361173629760742e-05, -5.1565468311309814e-05, -2.9519200325012207e-05, -7.4729323387146e-06, 1.4573335647583008e-05, 3.6619603633880615e-05, 5.866587162017822e-05, 8.071213960647583e-05, 0.00010275840759277344, 0.00012480467557907104, 0.00014685094356536865, 0.00016889721155166626, 0.00019094347953796387, 0.00021298974752426147, 0.00023503601551055908, 0.0002570822834968567, 0.0002791285514831543, 0.0003011748194694519, 0.0003232210874557495, 0.0003452673554420471, 0.0003673136234283447, 0.00038935989141464233, 0.00041140615940093994, 0.00043345242738723755, 0.00045549869537353516, 0.00047754496335983276, 0.0004995912313461304, 0.000521637499332428, 0.0005436837673187256, 0.0005657300353050232, 0.0005877763032913208, 0.0006098225712776184, 0.000631868839263916, 0.0006539151072502136, 0.0006759613752365112, 0.0006980076432228088, 0.0007200539112091064, 0.000742100179195404, 0.0007641464471817017, 0.0007861927151679993, 0.0008082389831542969]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 12.0, 12.0, 11.0, 33.0, 19.0, 41.0, 52.0, 72.0, 122.0, 240.0, 308.0, 574.0, 942.0, 1847.0, 3825.0, 8806.0, 23110.0, 69649.0, 277083.0, 495417.0, 109962.0, 33597.0, 12292.0, 5087.0, 2465.0, 1184.0, 673.0, 382.0, 243.0, 153.0, 108.0, 60.0, 47.0, 29.0, 26.0, 14.0, 14.0, 12.0, 8.0, 6.0, 2.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.8515625, -9.525146484375, -9.19873046875, -8.872314453125, -8.5458984375, -8.219482421875, -7.89306640625, -7.566650390625, -7.240234375, -6.913818359375, -6.58740234375, -6.260986328125, -5.9345703125, -5.608154296875, -5.28173828125, -4.955322265625, -4.62890625, -4.302490234375, -3.97607421875, -3.649658203125, -3.3232421875, -2.996826171875, -2.67041015625, -2.343994140625, -2.017578125, -1.691162109375, -1.36474609375, -1.038330078125, -0.7119140625, -0.385498046875, -0.05908203125, 0.267333984375, 0.59375, 0.920166015625, 1.24658203125, 1.572998046875, 1.8994140625, 2.225830078125, 2.55224609375, 2.878662109375, 3.205078125, 3.531494140625, 3.85791015625, 4.184326171875, 4.5107421875, 4.837158203125, 5.16357421875, 5.489990234375, 5.81640625, 6.142822265625, 6.46923828125, 6.795654296875, 7.1220703125, 7.448486328125, 7.77490234375, 8.101318359375, 8.427734375, 8.754150390625, 9.08056640625, 9.406982421875, 9.7333984375, 10.059814453125, 10.38623046875, 10.712646484375, 11.0390625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 9.0, 11.0, 14.0, 22.0, 26.0, 51.0, 60.0, 86.0, 80.0, 109.0, 115.0, 88.0, 92.0, 78.0, 46.0, 38.0, 27.0, 10.0, 5.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7880859375, -1.7073822021484375, -1.626678466796875, -1.5459747314453125, -1.46527099609375, -1.3845672607421875, -1.303863525390625, -1.2231597900390625, -1.1424560546875, -1.0617523193359375, -0.981048583984375, -0.9003448486328125, -0.81964111328125, -0.7389373779296875, -0.658233642578125, -0.5775299072265625, -0.496826171875, -0.4161224365234375, -0.335418701171875, -0.2547149658203125, -0.17401123046875, -0.0933074951171875, -0.012603759765625, 0.0680999755859375, 0.1488037109375, 0.2295074462890625, 0.310211181640625, 0.3909149169921875, 0.47161865234375, 0.5523223876953125, 0.633026123046875, 0.7137298583984375, 0.79443359375, 0.8751373291015625, 0.955841064453125, 1.0365447998046875, 1.11724853515625, 1.1979522705078125, 1.278656005859375, 1.3593597412109375, 1.4400634765625, 1.5207672119140625, 1.601470947265625, 1.6821746826171875, 1.76287841796875, 1.8435821533203125, 1.924285888671875, 2.0049896240234375, 2.085693359375, 2.1663970947265625, 2.247100830078125, 2.3278045654296875, 2.40850830078125, 2.4892120361328125, 2.569915771484375, 2.6506195068359375, 2.7313232421875, 2.8120269775390625, 2.892730712890625, 2.9734344482421875, 3.05413818359375, 3.1348419189453125, 3.215545654296875, 3.2962493896484375, 3.376953125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 14.0, 13.0, 20.0, 13.0, 23.0, 33.0, 38.0, 62.0, 77.0, 82.0, 100.0, 103.0, 103.0, 69.0, 45.0, 43.0, 31.0, 19.0, 19.0, 19.0, 7.0, 11.0, 14.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.768491744995117, -26.662609100341797, -25.55672836303711, -24.45084571838379, -23.34496307373047, -22.23908233642578, -21.13319969177246, -20.02731704711914, -18.921436309814453, -17.815553665161133, -16.709672927856445, -15.603790283203125, -14.497908592224121, -13.392026901245117, -12.286144256591797, -11.180262565612793, -10.074380874633789, -8.968499183654785, -7.862617015838623, -6.756734848022461, -5.650853157043457, -4.544971466064453, -3.439089298248291, -2.333207130432129, -1.227325439453125, -0.12144351005554199, 0.984438419342041, 2.090320348739624, 3.196202278137207, 4.302083969116211, 5.407966136932373, 6.513848304748535, 7.619728088378906, 8.72560977935791, 9.831491470336914, 10.937374114990234, 12.043255805969238, 13.149137496948242, 14.255020141601562, 15.360901832580566, 16.46678352355957, 17.57266616821289, 18.678546905517578, 19.7844295501709, 20.89031219482422, 21.996192932128906, 23.102075576782227, 24.207958221435547, 25.313838958740234, 26.419721603393555, 27.525602340698242, 28.631484985351562, 29.73736572265625, 30.84324836730957, 31.94913101196289, 33.05501174926758, 34.16089630126953, 35.26677703857422, 36.37266159057617, 37.47854232788086, 38.58442306518555, 39.6903076171875, 40.79618835449219, 41.902069091796875, 43.00794982910156]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 0.0, 5.0, 4.0, 7.0, 6.0, 8.0, 11.0, 5.0, 14.0, 11.0, 24.0, 26.0, 24.0, 33.0, 25.0, 27.0, 21.0, 33.0, 31.0, 37.0, 41.0, 43.0, 35.0, 41.0, 47.0, 52.0, 38.0, 38.0, 39.0, 40.0, 31.0, 21.0, 27.0, 19.0, 16.0, 21.0, 19.0, 11.0, 20.0, 8.0, 5.0, 14.0, 10.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.92969512939453, -21.270925521850586, -20.612157821655273, -19.953388214111328, -19.294620513916016, -18.63585090637207, -17.977083206176758, -17.318313598632812, -16.6595458984375, -16.000776290893555, -15.342008590698242, -14.683239936828613, -14.024471282958984, -13.365701675415039, -12.70693302154541, -12.048164367675781, -11.389394760131836, -10.730626106262207, -10.071857452392578, -9.41308879852295, -8.75432014465332, -8.095550537109375, -7.436781883239746, -6.778013229370117, -6.119244575500488, -5.460475921630859, -4.8017072677612305, -4.142938137054443, -3.4841694831848145, -2.8254008293151855, -2.1666319370269775, -1.5078630447387695, -0.8490943908691406, -0.19032561779022217, 0.4684431552886963, 1.1272119283676147, 1.7859807014465332, 2.444749355316162, 3.10351824760437, 3.762287139892578, 4.421055793762207, 5.079824447631836, 5.738593101501465, 6.397362232208252, 7.056130886077881, 7.71489953994751, 8.373668670654297, 9.032437324523926, 9.691205978393555, 10.349974632263184, 11.008743286132812, 11.667511940002441, 12.32628059387207, 12.985050201416016, 13.643818855285645, 14.302587509155273, 14.961356163024902, 15.620124816894531, 16.278894424438477, 16.93766212463379, 17.596431732177734, 18.255199432373047, 18.913969039916992, 19.572738647460938, 20.23150634765625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 11.0, 8.0, 14.0, 18.0, 26.0, 38.0, 65.0, 88.0, 127.0, 168.0, 264.0, 444.0, 613.0, 991.0, 1476.0, 2383.0, 3675.0, 5786.0, 9418.0, 14905.0, 24485.0, 39976.0, 66599.0, 110509.0, 170876.0, 199630.0, 152636.0, 95433.0, 56892.0, 34605.0, 21124.0, 12919.0, 8055.0, 5181.0, 3161.0, 2053.0, 1304.0, 870.0, 597.0, 381.0, 235.0, 161.0, 117.0, 93.0, 44.0, 36.0, 28.0, 12.0, 13.0, 6.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.5, -31.42919921875, -30.3583984375, -29.28759765625, -28.216796875, -27.14599609375, -26.0751953125, -25.00439453125, -23.93359375, -22.86279296875, -21.7919921875, -20.72119140625, -19.650390625, -18.57958984375, -17.5087890625, -16.43798828125, -15.3671875, -14.29638671875, -13.2255859375, -12.15478515625, -11.083984375, -10.01318359375, -8.9423828125, -7.87158203125, -6.80078125, -5.72998046875, -4.6591796875, -3.58837890625, -2.517578125, -1.44677734375, -0.3759765625, 0.69482421875, 1.765625, 2.83642578125, 3.9072265625, 4.97802734375, 6.048828125, 7.11962890625, 8.1904296875, 9.26123046875, 10.33203125, 11.40283203125, 12.4736328125, 13.54443359375, 14.615234375, 15.68603515625, 16.7568359375, 17.82763671875, 18.8984375, 19.96923828125, 21.0400390625, 22.11083984375, 23.181640625, 24.25244140625, 25.3232421875, 26.39404296875, 27.46484375, 28.53564453125, 29.6064453125, 30.67724609375, 31.748046875, 32.81884765625, 33.8896484375, 34.96044921875, 36.03125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 8.0, 2.0, 11.0, 6.0, 11.0, 7.0, 18.0, 16.0, 17.0, 16.0, 19.0, 31.0, 25.0, 32.0, 34.0, 26.0, 33.0, 27.0, 37.0, 40.0, 31.0, 36.0, 35.0, 41.0, 45.0, 38.0, 46.0, 31.0, 41.0, 33.0, 21.0, 20.0, 18.0, 19.0, 13.0, 17.0, 16.0, 16.0, 11.0, 7.0, 6.0, 10.0, 3.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0], "bins": [-18.34375, -17.8248291015625, -17.305908203125, -16.7869873046875, -16.26806640625, -15.7491455078125, -15.230224609375, -14.7113037109375, -14.1923828125, -13.6734619140625, -13.154541015625, -12.6356201171875, -12.11669921875, -11.5977783203125, -11.078857421875, -10.5599365234375, -10.041015625, -9.5220947265625, -9.003173828125, -8.4842529296875, -7.96533203125, -7.4464111328125, -6.927490234375, -6.4085693359375, -5.8896484375, -5.3707275390625, -4.851806640625, -4.3328857421875, -3.81396484375, -3.2950439453125, -2.776123046875, -2.2572021484375, -1.73828125, -1.2193603515625, -0.700439453125, -0.1815185546875, 0.33740234375, 0.8563232421875, 1.375244140625, 1.8941650390625, 2.4130859375, 2.9320068359375, 3.450927734375, 3.9698486328125, 4.48876953125, 5.0076904296875, 5.526611328125, 6.0455322265625, 6.564453125, 7.0833740234375, 7.602294921875, 8.1212158203125, 8.64013671875, 9.1590576171875, 9.677978515625, 10.1968994140625, 10.7158203125, 11.2347412109375, 11.753662109375, 12.2725830078125, 12.79150390625, 13.3104248046875, 13.829345703125, 14.3482666015625, 14.8671875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 12.0, 13.0, 21.0, 20.0, 55.0, 70.0, 83.0, 147.0, 210.0, 374.0, 561.0, 818.0, 1325.0, 2190.0, 3447.0, 5456.0, 8858.0, 15056.0, 24987.0, 43704.0, 77056.0, 139323.0, 225610.0, 211531.0, 123446.0, 68318.0, 38476.0, 22455.0, 13370.0, 7911.0, 5123.0, 3033.0, 1925.0, 1251.0, 836.0, 519.0, 356.0, 214.0, 141.0, 83.0, 65.0, 30.0, 24.0, 19.0, 17.0, 4.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-33.8125, -32.75244140625, -31.6923828125, -30.63232421875, -29.572265625, -28.51220703125, -27.4521484375, -26.39208984375, -25.33203125, -24.27197265625, -23.2119140625, -22.15185546875, -21.091796875, -20.03173828125, -18.9716796875, -17.91162109375, -16.8515625, -15.79150390625, -14.7314453125, -13.67138671875, -12.611328125, -11.55126953125, -10.4912109375, -9.43115234375, -8.37109375, -7.31103515625, -6.2509765625, -5.19091796875, -4.130859375, -3.07080078125, -2.0107421875, -0.95068359375, 0.109375, 1.16943359375, 2.2294921875, 3.28955078125, 4.349609375, 5.40966796875, 6.4697265625, 7.52978515625, 8.58984375, 9.64990234375, 10.7099609375, 11.77001953125, 12.830078125, 13.89013671875, 14.9501953125, 16.01025390625, 17.0703125, 18.13037109375, 19.1904296875, 20.25048828125, 21.310546875, 22.37060546875, 23.4306640625, 24.49072265625, 25.55078125, 26.61083984375, 27.6708984375, 28.73095703125, 29.791015625, 30.85107421875, 31.9111328125, 32.97119140625, 34.03125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 4.0, 8.0, 8.0, 10.0, 24.0, 15.0, 21.0, 17.0, 26.0, 23.0, 26.0, 27.0, 37.0, 37.0, 38.0, 26.0, 48.0, 44.0, 46.0, 36.0, 42.0, 49.0, 42.0, 33.0, 27.0, 38.0, 36.0, 32.0, 23.0, 15.0, 23.0, 14.0, 21.0, 17.0, 9.0, 9.0, 8.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0], "bins": [-13.5703125, -13.17578125, -12.78125, -12.38671875, -11.9921875, -11.59765625, -11.203125, -10.80859375, -10.4140625, -10.01953125, -9.625, -9.23046875, -8.8359375, -8.44140625, -8.046875, -7.65234375, -7.2578125, -6.86328125, -6.46875, -6.07421875, -5.6796875, -5.28515625, -4.890625, -4.49609375, -4.1015625, -3.70703125, -3.3125, -2.91796875, -2.5234375, -2.12890625, -1.734375, -1.33984375, -0.9453125, -0.55078125, -0.15625, 0.23828125, 0.6328125, 1.02734375, 1.421875, 1.81640625, 2.2109375, 2.60546875, 3.0, 3.39453125, 3.7890625, 4.18359375, 4.578125, 4.97265625, 5.3671875, 5.76171875, 6.15625, 6.55078125, 6.9453125, 7.33984375, 7.734375, 8.12890625, 8.5234375, 8.91796875, 9.3125, 9.70703125, 10.1015625, 10.49609375, 10.890625, 11.28515625, 11.6796875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 6.0, 11.0, 5.0, 14.0, 17.0, 17.0, 37.0, 44.0, 62.0, 96.0, 141.0, 193.0, 274.0, 355.0, 433.0, 626.0, 849.0, 1456.0, 2391.0, 4665.0, 10230.0, 29861.0, 161244.0, 715732.0, 82095.0, 20196.0, 7760.0, 3688.0, 1962.0, 1199.0, 793.0, 560.0, 389.0, 311.0, 260.0, 178.0, 124.0, 72.0, 58.0, 34.0, 29.0, 29.0, 10.0, 13.0, 11.0, 11.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-84.25, -81.64453125, -79.0390625, -76.43359375, -73.828125, -71.22265625, -68.6171875, -66.01171875, -63.40625, -60.80078125, -58.1953125, -55.58984375, -52.984375, -50.37890625, -47.7734375, -45.16796875, -42.5625, -39.95703125, -37.3515625, -34.74609375, -32.140625, -29.53515625, -26.9296875, -24.32421875, -21.71875, -19.11328125, -16.5078125, -13.90234375, -11.296875, -8.69140625, -6.0859375, -3.48046875, -0.875, 1.73046875, 4.3359375, 6.94140625, 9.546875, 12.15234375, 14.7578125, 17.36328125, 19.96875, 22.57421875, 25.1796875, 27.78515625, 30.390625, 32.99609375, 35.6015625, 38.20703125, 40.8125, 43.41796875, 46.0234375, 48.62890625, 51.234375, 53.83984375, 56.4453125, 59.05078125, 61.65625, 64.26171875, 66.8671875, 69.47265625, 72.078125, 74.68359375, 77.2890625, 79.89453125, 82.5]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 5.0, 4.0, 5.0, 10.0, 10.0, 22.0, 47.0, 59.0, 97.0, 138.0, 183.0, 147.0, 98.0, 62.0, 42.0, 31.0, 15.0, 7.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00299072265625, -0.0028858184814453125, -0.002780914306640625, -0.0026760101318359375, -0.00257110595703125, -0.0024662017822265625, -0.002361297607421875, -0.0022563934326171875, -0.0021514892578125, -0.0020465850830078125, -0.001941680908203125, -0.0018367767333984375, -0.00173187255859375, -0.0016269683837890625, -0.001522064208984375, -0.0014171600341796875, -0.001312255859375, -0.0012073516845703125, -0.001102447509765625, -0.0009975433349609375, -0.00089263916015625, -0.0007877349853515625, -0.000682830810546875, -0.0005779266357421875, -0.0004730224609375, -0.0003681182861328125, -0.000263214111328125, -0.0001583099365234375, -5.340576171875e-05, 5.14984130859375e-05, 0.000156402587890625, 0.0002613067626953125, 0.0003662109375, 0.0004711151123046875, 0.000576019287109375, 0.0006809234619140625, 0.00078582763671875, 0.0008907318115234375, 0.000995635986328125, 0.0011005401611328125, 0.0012054443359375, 0.0013103485107421875, 0.001415252685546875, 0.0015201568603515625, 0.00162506103515625, 0.0017299652099609375, 0.001834869384765625, 0.0019397735595703125, 0.002044677734375, 0.0021495819091796875, 0.002254486083984375, 0.0023593902587890625, 0.00246429443359375, 0.0025691986083984375, 0.002674102783203125, 0.0027790069580078125, 0.0028839111328125, 0.0029888153076171875, 0.003093719482421875, 0.0031986236572265625, 0.00330352783203125, 0.0034084320068359375, 0.003513336181640625, 0.0036182403564453125, 0.00372314453125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 6.0, 5.0, 15.0, 18.0, 18.0, 41.0, 56.0, 50.0, 84.0, 126.0, 163.0, 220.0, 336.0, 473.0, 677.0, 984.0, 1531.0, 2637.0, 4690.0, 10142.0, 27379.0, 125655.0, 702211.0, 121796.0, 27028.0, 10172.0, 4700.0, 2631.0, 1438.0, 990.0, 687.0, 444.0, 317.0, 248.0, 168.0, 117.0, 94.0, 55.0, 47.0, 34.0, 25.0, 17.0, 15.0, 9.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.625, -77.0966796875, -74.568359375, -72.0400390625, -69.51171875, -66.9833984375, -64.455078125, -61.9267578125, -59.3984375, -56.8701171875, -54.341796875, -51.8134765625, -49.28515625, -46.7568359375, -44.228515625, -41.7001953125, -39.171875, -36.6435546875, -34.115234375, -31.5869140625, -29.05859375, -26.5302734375, -24.001953125, -21.4736328125, -18.9453125, -16.4169921875, -13.888671875, -11.3603515625, -8.83203125, -6.3037109375, -3.775390625, -1.2470703125, 1.28125, 3.8095703125, 6.337890625, 8.8662109375, 11.39453125, 13.9228515625, 16.451171875, 18.9794921875, 21.5078125, 24.0361328125, 26.564453125, 29.0927734375, 31.62109375, 34.1494140625, 36.677734375, 39.2060546875, 41.734375, 44.2626953125, 46.791015625, 49.3193359375, 51.84765625, 54.3759765625, 56.904296875, 59.4326171875, 61.9609375, 64.4892578125, 67.017578125, 69.5458984375, 72.07421875, 74.6025390625, 77.130859375, 79.6591796875, 82.1875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 15.0, 17.0, 26.0, 40.0, 52.0, 79.0, 103.0, 129.0, 123.0, 117.0, 97.0, 50.0, 31.0, 27.0, 21.0, 12.0, 3.0, 3.0, 9.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.934326171875, -20.32177734375, -19.709228515625, -19.0966796875, -18.484130859375, -17.87158203125, -17.259033203125, -16.646484375, -16.033935546875, -15.42138671875, -14.808837890625, -14.1962890625, -13.583740234375, -12.97119140625, -12.358642578125, -11.74609375, -11.133544921875, -10.52099609375, -9.908447265625, -9.2958984375, -8.683349609375, -8.07080078125, -7.458251953125, -6.845703125, -6.233154296875, -5.62060546875, -5.008056640625, -4.3955078125, -3.782958984375, -3.17041015625, -2.557861328125, -1.9453125, -1.332763671875, -0.72021484375, -0.107666015625, 0.5048828125, 1.117431640625, 1.72998046875, 2.342529296875, 2.955078125, 3.567626953125, 4.18017578125, 4.792724609375, 5.4052734375, 6.017822265625, 6.63037109375, 7.242919921875, 7.85546875, 8.468017578125, 9.08056640625, 9.693115234375, 10.3056640625, 10.918212890625, 11.53076171875, 12.143310546875, 12.755859375, 13.368408203125, 13.98095703125, 14.593505859375, 15.2060546875, 15.818603515625, 16.43115234375, 17.043701171875, 17.65625]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 2.0, 3.0, 3.0, 7.0, 8.0, 13.0, 10.0, 14.0, 19.0, 33.0, 53.0, 53.0, 72.0, 82.0, 100.0, 98.0, 93.0, 55.0, 64.0, 41.0, 44.0, 14.0, 23.0, 21.0, 14.0, 13.0, 8.0, 7.0, 4.0, 3.0, 2.0, 6.0, 4.0, 3.0, 6.0, 0.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.921016693115234, -21.94912338256836, -20.97722816467285, -20.005332946777344, -19.03343963623047, -18.061546325683594, -17.089651107788086, -16.117755889892578, -15.145862579345703, -14.173968315124512, -13.20207405090332, -12.230179786682129, -11.258285522460938, -10.286391258239746, -9.314496994018555, -8.342602729797363, -7.370708465576172, -6.3988142013549805, -5.426919937133789, -4.455025672912598, -3.4831314086914062, -2.511237144470215, -1.5393428802490234, -0.567448616027832, 0.4044456481933594, 1.3763399124145508, 2.348234176635742, 3.3201284408569336, 4.292022705078125, 5.263916969299316, 6.235811233520508, 7.207705497741699, 8.17959976196289, 9.151494026184082, 10.123388290405273, 11.095282554626465, 12.067176818847656, 13.039071083068848, 14.010965347290039, 14.98285961151123, 15.954753875732422, 16.926647186279297, 17.898542404174805, 18.870437622070312, 19.842330932617188, 20.814224243164062, 21.78611946105957, 22.758014678955078, 23.729907989501953, 24.701801300048828, 25.673696517944336, 26.645591735839844, 27.61748504638672, 28.589378356933594, 29.5612735748291, 30.53316879272461, 31.505062103271484, 32.47695541381836, 33.4488525390625, 34.420745849609375, 35.39263916015625, 36.364532470703125, 37.33642578125, 38.30832290649414, 39.280216217041016]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 6.0, 8.0, 8.0, 8.0, 9.0, 12.0, 17.0, 19.0, 18.0, 28.0, 25.0, 29.0, 32.0, 32.0, 32.0, 30.0, 44.0, 32.0, 45.0, 32.0, 28.0, 30.0, 29.0, 35.0, 24.0, 44.0, 29.0, 34.0, 32.0, 29.0, 37.0, 21.0, 26.0, 21.0, 11.0, 18.0, 13.0, 11.0, 7.0, 7.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.311603546142578, -19.699729919433594, -19.087858200073242, -18.475984573364258, -17.864112854003906, -17.252239227294922, -16.640365600585938, -16.028491973876953, -15.416620254516602, -14.804747581481934, -14.192874908447266, -13.581001281738281, -12.969128608703613, -12.357255935668945, -11.745382308959961, -11.133509635925293, -10.521636962890625, -9.909764289855957, -9.297891616821289, -8.686017990112305, -8.074145317077637, -7.462272644042969, -6.850399494171143, -6.238526344299316, -5.626653671264648, -5.0147809982299805, -4.402907848358154, -3.7910349369049072, -3.17916202545166, -2.567289113998413, -1.955416202545166, -1.3435430526733398, -0.7316703796386719, -0.1197974681854248, 0.49207544326782227, 1.1039483547210693, 1.7158212661743164, 2.3276941776275635, 2.9395670890808105, 3.5514402389526367, 4.163312911987305, 4.775185585021973, 5.387058734893799, 5.998931884765625, 6.610804557800293, 7.222677230834961, 7.834550380706787, 8.446423530578613, 9.058296203613281, 9.67016887664795, 10.282041549682617, 10.893915176391602, 11.50578784942627, 12.117660522460938, 12.729534149169922, 13.34140682220459, 13.953279495239258, 14.565152168273926, 15.177024841308594, 15.788898468017578, 16.400772094726562, 17.012643814086914, 17.6245174407959, 18.23638916015625, 18.848262786865234]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 8.0, 5.0, 8.0, 21.0, 29.0, 39.0, 55.0, 84.0, 116.0, 166.0, 260.0, 387.0, 544.0, 780.0, 1141.0, 1745.0, 2635.0, 4249.0, 6607.0, 10643.0, 17185.0, 28978.0, 49402.0, 88919.0, 176958.0, 468194.0, 1411898.0, 1194957.0, 370518.0, 158295.0, 82360.0, 46427.0, 27000.0, 16280.0, 9707.0, 6336.0, 3927.0, 2595.0, 1730.0, 1093.0, 673.0, 506.0, 291.0, 189.0, 138.0, 79.0, 48.0, 31.0, 21.0, 16.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0], "bins": [-28.46875, -27.653076171875, -26.83740234375, -26.021728515625, -25.2060546875, -24.390380859375, -23.57470703125, -22.759033203125, -21.943359375, -21.127685546875, -20.31201171875, -19.496337890625, -18.6806640625, -17.864990234375, -17.04931640625, -16.233642578125, -15.41796875, -14.602294921875, -13.78662109375, -12.970947265625, -12.1552734375, -11.339599609375, -10.52392578125, -9.708251953125, -8.892578125, -8.076904296875, -7.26123046875, -6.445556640625, -5.6298828125, -4.814208984375, -3.99853515625, -3.182861328125, -2.3671875, -1.551513671875, -0.73583984375, 0.079833984375, 0.8955078125, 1.711181640625, 2.52685546875, 3.342529296875, 4.158203125, 4.973876953125, 5.78955078125, 6.605224609375, 7.4208984375, 8.236572265625, 9.05224609375, 9.867919921875, 10.68359375, 11.499267578125, 12.31494140625, 13.130615234375, 13.9462890625, 14.761962890625, 15.57763671875, 16.393310546875, 17.208984375, 18.024658203125, 18.84033203125, 19.656005859375, 20.4716796875, 21.287353515625, 22.10302734375, 22.918701171875, 23.734375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 7.0, 5.0, 6.0, 6.0, 14.0, 15.0, 16.0, 12.0, 29.0, 25.0, 33.0, 35.0, 24.0, 44.0, 37.0, 34.0, 36.0, 40.0, 43.0, 35.0, 39.0, 35.0, 51.0, 47.0, 29.0, 33.0, 35.0, 32.0, 31.0, 26.0, 24.0, 20.0, 14.0, 17.0, 16.0, 16.0, 8.0, 5.0, 8.0, 10.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.7265625, -13.34423828125, -12.9619140625, -12.57958984375, -12.197265625, -11.81494140625, -11.4326171875, -11.05029296875, -10.66796875, -10.28564453125, -9.9033203125, -9.52099609375, -9.138671875, -8.75634765625, -8.3740234375, -7.99169921875, -7.609375, -7.22705078125, -6.8447265625, -6.46240234375, -6.080078125, -5.69775390625, -5.3154296875, -4.93310546875, -4.55078125, -4.16845703125, -3.7861328125, -3.40380859375, -3.021484375, -2.63916015625, -2.2568359375, -1.87451171875, -1.4921875, -1.10986328125, -0.7275390625, -0.34521484375, 0.037109375, 0.41943359375, 0.8017578125, 1.18408203125, 1.56640625, 1.94873046875, 2.3310546875, 2.71337890625, 3.095703125, 3.47802734375, 3.8603515625, 4.24267578125, 4.625, 5.00732421875, 5.3896484375, 5.77197265625, 6.154296875, 6.53662109375, 6.9189453125, 7.30126953125, 7.68359375, 8.06591796875, 8.4482421875, 8.83056640625, 9.212890625, 9.59521484375, 9.9775390625, 10.35986328125, 10.7421875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 13.0, 11.0, 25.0, 37.0, 41.0, 60.0, 109.0, 152.0, 221.0, 284.0, 357.0, 517.0, 802.0, 1130.0, 1527.0, 2215.0, 3323.0, 4845.0, 7117.0, 11085.0, 17729.0, 28454.0, 48312.0, 86073.0, 162506.0, 335044.0, 793347.0, 1422173.0, 649895.0, 285420.0, 141038.0, 75509.0, 42679.0, 25428.0, 15699.0, 10060.0, 6552.0, 4368.0, 3052.0, 2098.0, 1483.0, 1050.0, 695.0, 536.0, 349.0, 279.0, 185.0, 130.0, 90.0, 66.0, 46.0, 21.0, 16.0, 20.0, 2.0, 7.0, 6.0, 2.0, 1.0], "bins": [-20.0, -19.382568359375, -18.76513671875, -18.147705078125, -17.5302734375, -16.912841796875, -16.29541015625, -15.677978515625, -15.060546875, -14.443115234375, -13.82568359375, -13.208251953125, -12.5908203125, -11.973388671875, -11.35595703125, -10.738525390625, -10.12109375, -9.503662109375, -8.88623046875, -8.268798828125, -7.6513671875, -7.033935546875, -6.41650390625, -5.799072265625, -5.181640625, -4.564208984375, -3.94677734375, -3.329345703125, -2.7119140625, -2.094482421875, -1.47705078125, -0.859619140625, -0.2421875, 0.375244140625, 0.99267578125, 1.610107421875, 2.2275390625, 2.844970703125, 3.46240234375, 4.079833984375, 4.697265625, 5.314697265625, 5.93212890625, 6.549560546875, 7.1669921875, 7.784423828125, 8.40185546875, 9.019287109375, 9.63671875, 10.254150390625, 10.87158203125, 11.489013671875, 12.1064453125, 12.723876953125, 13.34130859375, 13.958740234375, 14.576171875, 15.193603515625, 15.81103515625, 16.428466796875, 17.0458984375, 17.663330078125, 18.28076171875, 18.898193359375, 19.515625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 2.0, 4.0, 10.0, 6.0, 18.0, 17.0, 18.0, 24.0, 32.0, 40.0, 72.0, 69.0, 82.0, 117.0, 148.0, 156.0, 199.0, 256.0, 265.0, 339.0, 339.0, 339.0, 257.0, 205.0, 195.0, 163.0, 130.0, 93.0, 99.0, 62.0, 58.0, 50.0, 36.0, 48.0, 27.0, 25.0, 14.0, 11.0, 13.0, 7.0, 6.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.12109375, -5.90765380859375, -5.6942138671875, -5.48077392578125, -5.267333984375, -5.05389404296875, -4.8404541015625, -4.62701416015625, -4.41357421875, -4.20013427734375, -3.9866943359375, -3.77325439453125, -3.559814453125, -3.34637451171875, -3.1329345703125, -2.91949462890625, -2.7060546875, -2.49261474609375, -2.2791748046875, -2.06573486328125, -1.852294921875, -1.63885498046875, -1.4254150390625, -1.21197509765625, -0.99853515625, -0.78509521484375, -0.5716552734375, -0.35821533203125, -0.144775390625, 0.06866455078125, 0.2821044921875, 0.49554443359375, 0.708984375, 0.92242431640625, 1.1358642578125, 1.34930419921875, 1.562744140625, 1.77618408203125, 1.9896240234375, 2.20306396484375, 2.41650390625, 2.62994384765625, 2.8433837890625, 3.05682373046875, 3.270263671875, 3.48370361328125, 3.6971435546875, 3.91058349609375, 4.1240234375, 4.33746337890625, 4.5509033203125, 4.76434326171875, 4.977783203125, 5.19122314453125, 5.4046630859375, 5.61810302734375, 5.83154296875, 6.04498291015625, 6.2584228515625, 6.47186279296875, 6.685302734375, 6.89874267578125, 7.1121826171875, 7.32562255859375, 7.5390625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 6.0, 11.0, 15.0, 13.0, 25.0, 28.0, 37.0, 37.0, 73.0, 80.0, 114.0, 118.0, 126.0, 78.0, 53.0, 38.0, 40.0, 22.0, 20.0, 14.0, 9.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.501096725463867, -20.716760635375977, -19.932422637939453, -19.148086547851562, -18.363750457763672, -17.57941436767578, -16.79507827758789, -16.010740280151367, -15.226404190063477, -14.442068099975586, -13.657731056213379, -12.873394012451172, -12.089057922363281, -11.30472183227539, -10.520384788513184, -9.736047744750977, -8.951711654663086, -8.167375564575195, -7.383038520812988, -6.5987019538879395, -5.814365386962891, -5.030028820037842, -4.245692253112793, -3.461355686187744, -2.6770191192626953, -1.8926825523376465, -1.1083459854125977, -0.32400941848754883, 0.4603271484375, 1.2446637153625488, 2.0290002822875977, 2.8133368492126465, 3.597675323486328, 4.382011890411377, 5.166348457336426, 5.950685024261475, 6.735021591186523, 7.519358158111572, 8.303694725036621, 9.088031768798828, 9.872367858886719, 10.65670394897461, 11.441040992736816, 12.225378036499023, 13.009714126586914, 13.794050216674805, 14.578387260437012, 15.362724304199219, 16.14706039428711, 16.931396484375, 17.71573257446289, 18.500070571899414, 19.284406661987305, 20.068742752075195, 20.85308074951172, 21.63741683959961, 22.4217529296875, 23.20608901977539, 23.99042510986328, 24.774763107299805, 25.559099197387695, 26.343435287475586, 27.12777328491211, 27.912109375, 28.69644546508789]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 7.0, 4.0, 10.0, 7.0, 8.0, 11.0, 16.0, 16.0, 16.0, 23.0, 27.0, 25.0, 23.0, 25.0, 34.0, 28.0, 34.0, 26.0, 26.0, 27.0, 35.0, 28.0, 30.0, 36.0, 27.0, 47.0, 42.0, 33.0, 32.0, 28.0, 22.0, 23.0, 19.0, 32.0, 24.0, 20.0, 24.0, 11.0, 9.0, 12.0, 17.0, 10.0, 8.0, 8.0, 8.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-12.227036476135254, -11.833412170410156, -11.439786911010742, -11.046162605285645, -10.652538299560547, -10.258913040161133, -9.865288734436035, -9.471664428710938, -9.078039169311523, -8.684414863586426, -8.290789604187012, -7.897165298461914, -7.503540992736816, -7.1099162101745605, -6.716291427612305, -6.322667121887207, -5.929042816162109, -5.5354180335998535, -5.141793727874756, -4.7481689453125, -4.354544639587402, -3.9609198570251465, -3.5672950744628906, -3.173670530319214, -2.780045986175537, -2.3864214420318604, -1.992796778678894, -1.5991721153259277, -1.205547571182251, -0.8119230270385742, -0.41829824447631836, -0.0246737003326416, 0.36895179748535156, 0.7625764012336731, 1.1562010049819946, 1.549825668334961, 1.9434502124786377, 2.3370747566223145, 2.7306995391845703, 3.124324083328247, 3.517948627471924, 3.9115731716156006, 4.305197715759277, 4.698822498321533, 5.092447280883789, 5.486071586608887, 5.879696369171143, 6.273321151733398, 6.666945457458496, 7.060570240020752, 7.45419454574585, 7.8478193283081055, 8.241443634033203, 8.635068893432617, 9.028693199157715, 9.422317504882812, 9.815942764282227, 10.209567070007324, 10.603192329406738, 10.996816635131836, 11.390440940856934, 11.784065246582031, 12.177690505981445, 12.571314811706543, 12.96493911743164]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 13.0, 9.0, 12.0, 14.0, 25.0, 46.0, 71.0, 128.0, 230.0, 401.0, 725.0, 1306.0, 2378.0, 4444.0, 8322.0, 16308.0, 33110.0, 69649.0, 165591.0, 345390.0, 222653.0, 92546.0, 42053.0, 20405.0, 10609.0, 5505.0, 2930.0, 1598.0, 912.0, 488.0, 292.0, 178.0, 83.0, 50.0, 22.0, 21.0, 16.0, 10.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.40625, -15.88818359375, -15.3701171875, -14.85205078125, -14.333984375, -13.81591796875, -13.2978515625, -12.77978515625, -12.26171875, -11.74365234375, -11.2255859375, -10.70751953125, -10.189453125, -9.67138671875, -9.1533203125, -8.63525390625, -8.1171875, -7.59912109375, -7.0810546875, -6.56298828125, -6.044921875, -5.52685546875, -5.0087890625, -4.49072265625, -3.97265625, -3.45458984375, -2.9365234375, -2.41845703125, -1.900390625, -1.38232421875, -0.8642578125, -0.34619140625, 0.171875, 0.68994140625, 1.2080078125, 1.72607421875, 2.244140625, 2.76220703125, 3.2802734375, 3.79833984375, 4.31640625, 4.83447265625, 5.3525390625, 5.87060546875, 6.388671875, 6.90673828125, 7.4248046875, 7.94287109375, 8.4609375, 8.97900390625, 9.4970703125, 10.01513671875, 10.533203125, 11.05126953125, 11.5693359375, 12.08740234375, 12.60546875, 13.12353515625, 13.6416015625, 14.15966796875, 14.677734375, 15.19580078125, 15.7138671875, 16.23193359375, 16.75]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 11.0, 11.0, 12.0, 15.0, 10.0, 11.0, 31.0, 20.0, 20.0, 23.0, 29.0, 26.0, 30.0, 27.0, 31.0, 34.0, 35.0, 35.0, 35.0, 35.0, 47.0, 40.0, 49.0, 39.0, 38.0, 32.0, 29.0, 31.0, 25.0, 20.0, 17.0, 25.0, 15.0, 16.0, 15.0, 12.0, 11.0, 10.0, 13.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.4453125, -12.0272216796875, -11.609130859375, -11.1910400390625, -10.77294921875, -10.3548583984375, -9.936767578125, -9.5186767578125, -9.1005859375, -8.6824951171875, -8.264404296875, -7.8463134765625, -7.42822265625, -7.0101318359375, -6.592041015625, -6.1739501953125, -5.755859375, -5.3377685546875, -4.919677734375, -4.5015869140625, -4.08349609375, -3.6654052734375, -3.247314453125, -2.8292236328125, -2.4111328125, -1.9930419921875, -1.574951171875, -1.1568603515625, -0.73876953125, -0.3206787109375, 0.097412109375, 0.5155029296875, 0.93359375, 1.3516845703125, 1.769775390625, 2.1878662109375, 2.60595703125, 3.0240478515625, 3.442138671875, 3.8602294921875, 4.2783203125, 4.6964111328125, 5.114501953125, 5.5325927734375, 5.95068359375, 6.3687744140625, 6.786865234375, 7.2049560546875, 7.623046875, 8.0411376953125, 8.459228515625, 8.8773193359375, 9.29541015625, 9.7135009765625, 10.131591796875, 10.5496826171875, 10.9677734375, 11.3858642578125, 11.803955078125, 12.2220458984375, 12.64013671875, 13.0582275390625, 13.476318359375, 13.8944091796875, 14.3125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 2.0, 1.0, 4.0, 5.0, 8.0, 21.0, 17.0, 30.0, 45.0, 57.0, 94.0, 104.0, 161.0, 228.0, 289.0, 455.0, 656.0, 933.0, 1455.0, 2197.0, 3515.0, 5425.0, 9344.0, 16766.0, 32042.0, 69332.0, 187407.0, 432264.0, 156984.0, 61094.0, 29078.0, 15144.0, 8638.0, 5207.0, 3205.0, 2042.0, 1386.0, 920.0, 600.0, 416.0, 275.0, 173.0, 143.0, 103.0, 89.0, 51.0, 39.0, 30.0, 23.0, 21.0, 11.0, 11.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0], "bins": [-14.078125, -13.630126953125, -13.18212890625, -12.734130859375, -12.2861328125, -11.838134765625, -11.39013671875, -10.942138671875, -10.494140625, -10.046142578125, -9.59814453125, -9.150146484375, -8.7021484375, -8.254150390625, -7.80615234375, -7.358154296875, -6.91015625, -6.462158203125, -6.01416015625, -5.566162109375, -5.1181640625, -4.670166015625, -4.22216796875, -3.774169921875, -3.326171875, -2.878173828125, -2.43017578125, -1.982177734375, -1.5341796875, -1.086181640625, -0.63818359375, -0.190185546875, 0.2578125, 0.705810546875, 1.15380859375, 1.601806640625, 2.0498046875, 2.497802734375, 2.94580078125, 3.393798828125, 3.841796875, 4.289794921875, 4.73779296875, 5.185791015625, 5.6337890625, 6.081787109375, 6.52978515625, 6.977783203125, 7.42578125, 7.873779296875, 8.32177734375, 8.769775390625, 9.2177734375, 9.665771484375, 10.11376953125, 10.561767578125, 11.009765625, 11.457763671875, 11.90576171875, 12.353759765625, 12.8017578125, 13.249755859375, 13.69775390625, 14.145751953125, 14.59375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 2.0, 6.0, 4.0, 5.0, 5.0, 7.0, 9.0, 9.0, 10.0, 8.0, 18.0, 19.0, 16.0, 22.0, 24.0, 30.0, 31.0, 30.0, 30.0, 50.0, 41.0, 41.0, 46.0, 38.0, 29.0, 47.0, 44.0, 28.0, 36.0, 35.0, 33.0, 23.0, 23.0, 24.0, 34.0, 18.0, 22.0, 24.0, 12.0, 12.0, 11.0, 8.0, 8.0, 6.0, 5.0, 8.0, 3.0, 6.0, 4.0, 0.0, 1.0], "bins": [-11.359375, -11.0543212890625, -10.749267578125, -10.4442138671875, -10.13916015625, -9.8341064453125, -9.529052734375, -9.2239990234375, -8.9189453125, -8.6138916015625, -8.308837890625, -8.0037841796875, -7.69873046875, -7.3936767578125, -7.088623046875, -6.7835693359375, -6.478515625, -6.1734619140625, -5.868408203125, -5.5633544921875, -5.25830078125, -4.9532470703125, -4.648193359375, -4.3431396484375, -4.0380859375, -3.7330322265625, -3.427978515625, -3.1229248046875, -2.81787109375, -2.5128173828125, -2.207763671875, -1.9027099609375, -1.59765625, -1.2926025390625, -0.987548828125, -0.6824951171875, -0.37744140625, -0.0723876953125, 0.232666015625, 0.5377197265625, 0.8427734375, 1.1478271484375, 1.452880859375, 1.7579345703125, 2.06298828125, 2.3680419921875, 2.673095703125, 2.9781494140625, 3.283203125, 3.5882568359375, 3.893310546875, 4.1983642578125, 4.50341796875, 4.8084716796875, 5.113525390625, 5.4185791015625, 5.7236328125, 6.0286865234375, 6.333740234375, 6.6387939453125, 6.94384765625, 7.2489013671875, 7.553955078125, 7.8590087890625, 8.1640625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 0.0, 6.0, 8.0, 6.0, 8.0, 10.0, 23.0, 31.0, 40.0, 75.0, 86.0, 127.0, 181.0, 272.0, 498.0, 871.0, 1515.0, 3283.0, 7619.0, 22198.0, 113529.0, 757961.0, 104660.0, 21406.0, 7177.0, 3085.0, 1602.0, 910.0, 500.0, 327.0, 173.0, 114.0, 83.0, 51.0, 20.0, 34.0, 4.0, 21.0, 9.0, 9.0, 10.0, 5.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.77734375, -4.61529541015625, -4.4532470703125, -4.29119873046875, -4.129150390625, -3.96710205078125, -3.8050537109375, -3.64300537109375, -3.48095703125, -3.31890869140625, -3.1568603515625, -2.99481201171875, -2.832763671875, -2.67071533203125, -2.5086669921875, -2.34661865234375, -2.1845703125, -2.02252197265625, -1.8604736328125, -1.69842529296875, -1.536376953125, -1.37432861328125, -1.2122802734375, -1.05023193359375, -0.88818359375, -0.72613525390625, -0.5640869140625, -0.40203857421875, -0.239990234375, -0.07794189453125, 0.0841064453125, 0.24615478515625, 0.408203125, 0.57025146484375, 0.7322998046875, 0.89434814453125, 1.056396484375, 1.21844482421875, 1.3804931640625, 1.54254150390625, 1.70458984375, 1.86663818359375, 2.0286865234375, 2.19073486328125, 2.352783203125, 2.51483154296875, 2.6768798828125, 2.83892822265625, 3.0009765625, 3.16302490234375, 3.3250732421875, 3.48712158203125, 3.649169921875, 3.81121826171875, 3.9732666015625, 4.13531494140625, 4.29736328125, 4.45941162109375, 4.6214599609375, 4.78350830078125, 4.945556640625, 5.10760498046875, 5.2696533203125, 5.43170166015625, 5.59375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 9.0, 15.0, 10.0, 20.0, 24.0, 9.0, 24.0, 17.0, 32.0, 42.0, 37.0, 53.0, 61.0, 68.0, 77.0, 70.0, 72.0, 52.0, 51.0, 47.0, 36.0, 25.0, 22.0, 17.0, 14.0, 12.0, 13.0, 10.0, 7.0, 11.0, 12.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023818016052246094, -0.00023052841424942017, -0.0002228766679763794, -0.00021522492170333862, -0.00020757317543029785, -0.00019992142915725708, -0.0001922696828842163, -0.00018461793661117554, -0.00017696619033813477, -0.000169314444065094, -0.00016166269779205322, -0.00015401095151901245, -0.00014635920524597168, -0.0001387074589729309, -0.00013105571269989014, -0.00012340396642684937, -0.0001157522201538086, -0.00010810047388076782, -0.00010044872760772705, -9.279698133468628e-05, -8.514523506164551e-05, -7.749348878860474e-05, -6.984174251556396e-05, -6.21899962425232e-05, -5.453824996948242e-05, -4.688650369644165e-05, -3.923475742340088e-05, -3.158301115036011e-05, -2.3931264877319336e-05, -1.6279518604278564e-05, -8.627772331237793e-06, -9.760260581970215e-07, 6.67572021484375e-06, 1.4327466487884521e-05, 2.1979212760925293e-05, 2.9630959033966064e-05, 3.7282705307006836e-05, 4.493445158004761e-05, 5.258619785308838e-05, 6.023794412612915e-05, 6.788969039916992e-05, 7.55414366722107e-05, 8.319318294525146e-05, 9.084492921829224e-05, 9.849667549133301e-05, 0.00010614842176437378, 0.00011380016803741455, 0.00012145191431045532, 0.0001291036605834961, 0.00013675540685653687, 0.00014440715312957764, 0.0001520588994026184, 0.00015971064567565918, 0.00016736239194869995, 0.00017501413822174072, 0.0001826658844947815, 0.00019031763076782227, 0.00019796937704086304, 0.0002056211233139038, 0.00021327286958694458, 0.00022092461585998535, 0.00022857636213302612, 0.0002362281084060669, 0.00024387985467910767, 0.00025153160095214844]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [6.0, 0.0, 4.0, 0.0, 2.0, 8.0, 2.0, 10.0, 15.0, 12.0, 16.0, 36.0, 52.0, 37.0, 67.0, 79.0, 127.0, 173.0, 223.0, 337.0, 503.0, 614.0, 962.0, 1353.0, 2017.0, 3152.0, 4880.0, 7576.0, 12365.0, 22033.0, 43772.0, 112429.0, 490479.0, 210003.0, 63077.0, 29345.0, 16028.0, 9363.0, 5770.0, 3708.0, 2404.0, 1644.0, 1138.0, 772.0, 535.0, 395.0, 268.0, 199.0, 155.0, 122.0, 94.0, 61.0, 34.0, 32.0, 30.0, 17.0, 15.0, 8.0, 4.0, 8.0, 2.0, 1.0, 0.0, 3.0], "bins": [-4.95703125, -4.8055419921875, -4.654052734375, -4.5025634765625, -4.35107421875, -4.1995849609375, -4.048095703125, -3.8966064453125, -3.7451171875, -3.5936279296875, -3.442138671875, -3.2906494140625, -3.13916015625, -2.9876708984375, -2.836181640625, -2.6846923828125, -2.533203125, -2.3817138671875, -2.230224609375, -2.0787353515625, -1.92724609375, -1.7757568359375, -1.624267578125, -1.4727783203125, -1.3212890625, -1.1697998046875, -1.018310546875, -0.8668212890625, -0.71533203125, -0.5638427734375, -0.412353515625, -0.2608642578125, -0.109375, 0.0421142578125, 0.193603515625, 0.3450927734375, 0.49658203125, 0.6480712890625, 0.799560546875, 0.9510498046875, 1.1025390625, 1.2540283203125, 1.405517578125, 1.5570068359375, 1.70849609375, 1.8599853515625, 2.011474609375, 2.1629638671875, 2.314453125, 2.4659423828125, 2.617431640625, 2.7689208984375, 2.92041015625, 3.0718994140625, 3.223388671875, 3.3748779296875, 3.5263671875, 3.6778564453125, 3.829345703125, 3.9808349609375, 4.13232421875, 4.2838134765625, 4.435302734375, 4.5867919921875, 4.73828125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 0.0, 2.0, 5.0, 2.0, 4.0, 6.0, 16.0, 9.0, 18.0, 21.0, 13.0, 13.0, 19.0, 19.0, 23.0, 42.0, 41.0, 69.0, 87.0, 106.0, 83.0, 83.0, 60.0, 45.0, 32.0, 21.0, 25.0, 16.0, 21.0, 20.0, 13.0, 13.0, 9.0, 10.0, 6.0, 6.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.23046875, -1.1892852783203125, -1.148101806640625, -1.1069183349609375, -1.06573486328125, -1.0245513916015625, -0.983367919921875, -0.9421844482421875, -0.9010009765625, -0.8598175048828125, -0.818634033203125, -0.7774505615234375, -0.73626708984375, -0.6950836181640625, -0.653900146484375, -0.6127166748046875, -0.571533203125, -0.5303497314453125, -0.489166259765625, -0.4479827880859375, -0.40679931640625, -0.3656158447265625, -0.324432373046875, -0.2832489013671875, -0.2420654296875, -0.2008819580078125, -0.159698486328125, -0.1185150146484375, -0.07733154296875, -0.0361480712890625, 0.005035400390625, 0.0462188720703125, 0.08740234375, 0.1285858154296875, 0.169769287109375, 0.2109527587890625, 0.25213623046875, 0.2933197021484375, 0.334503173828125, 0.3756866455078125, 0.4168701171875, 0.4580535888671875, 0.499237060546875, 0.5404205322265625, 0.58160400390625, 0.6227874755859375, 0.663970947265625, 0.7051544189453125, 0.746337890625, 0.7875213623046875, 0.828704833984375, 0.8698883056640625, 0.91107177734375, 0.9522552490234375, 0.993438720703125, 1.0346221923828125, 1.0758056640625, 1.1169891357421875, 1.158172607421875, 1.1993560791015625, 1.24053955078125, 1.2817230224609375, 1.322906494140625, 1.3640899658203125, 1.4052734375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 10.0, 13.0, 16.0, 27.0, 40.0, 35.0, 57.0, 91.0, 111.0, 134.0, 109.0, 89.0, 60.0, 47.0, 28.0, 27.0, 22.0, 15.0, 10.0, 10.0, 7.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.70577049255371, -19.927024841308594, -19.148279190063477, -18.36953353881836, -17.590789794921875, -16.812044143676758, -16.03329849243164, -15.254552841186523, -14.475807189941406, -13.697061538696289, -12.918315887451172, -12.139571189880371, -11.360825538635254, -10.582079887390137, -9.803335189819336, -9.024589538574219, -8.245843887329102, -7.467098236083984, -6.688353061676025, -5.909607887268066, -5.130862236022949, -4.352116584777832, -3.573371410369873, -2.794626235961914, -2.015880584716797, -1.2371351718902588, -0.4583897590637207, 0.3203556537628174, 1.0991010665893555, 1.8778464794158936, 2.6565918922424316, 3.4353370666503906, 4.214082717895508, 4.992828369140625, 5.771573543548584, 6.550318717956543, 7.32906436920166, 8.107810020446777, 8.886554718017578, 9.665300369262695, 10.444046020507812, 11.22279167175293, 12.001537322998047, 12.780282020568848, 13.559027671813965, 14.337773323059082, 15.116518020629883, 15.895263671875, 16.674009323120117, 17.452754974365234, 18.23150062561035, 19.01024627685547, 19.788990020751953, 20.56773567199707, 21.346481323242188, 22.125226974487305, 22.903972625732422, 23.68271827697754, 24.461463928222656, 25.240209579467773, 26.01895523071289, 26.797698974609375, 27.576444625854492, 28.35519027709961, 29.133935928344727]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 1.0, 3.0, 6.0, 10.0, 5.0, 7.0, 3.0, 15.0, 15.0, 16.0, 19.0, 20.0, 25.0, 20.0, 25.0, 24.0, 32.0, 24.0, 30.0, 37.0, 26.0, 27.0, 30.0, 37.0, 33.0, 27.0, 38.0, 35.0, 43.0, 28.0, 46.0, 24.0, 25.0, 22.0, 24.0, 20.0, 23.0, 21.0, 22.0, 21.0, 9.0, 14.0, 17.0, 9.0, 8.0, 4.0, 11.0, 4.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-12.19740104675293, -11.80628776550293, -11.415173530578613, -11.024060249328613, -10.632946014404297, -10.241832733154297, -9.850719451904297, -9.45960521697998, -9.068490982055664, -8.677377700805664, -8.286263465881348, -7.895150184631348, -7.504035949707031, -7.112922668457031, -6.721808910369873, -6.330695152282715, -5.939581871032715, -5.548468112945557, -5.157354354858398, -4.766241073608398, -4.375126838684082, -3.984013319015503, -3.592899799346924, -3.2017860412597656, -2.8106722831726074, -2.419558525085449, -2.028444766998291, -1.637331247329712, -1.2462174892425537, -0.8551037311553955, -0.4639902114868164, -0.0728764533996582, 0.3182373046875, 0.7093510031700134, 1.1004647016525269, 1.4915783405303955, 1.8826920986175537, 2.273805856704712, 2.664919376373291, 3.056033134460449, 3.4471468925476074, 3.8382606506347656, 4.229374408721924, 4.620488166809082, 5.011601448059082, 5.402715682983398, 5.793828964233398, 6.184942722320557, 6.576056480407715, 6.967170238494873, 7.358283996582031, 7.749397277832031, 8.140511512756348, 8.531624794006348, 8.922739028930664, 9.313852310180664, 9.704965591430664, 10.096078872680664, 10.48719310760498, 10.87830638885498, 11.269420623779297, 11.660533905029297, 12.051647186279297, 12.442761421203613, 12.83387565612793]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 10.0, 10.0, 18.0, 21.0, 44.0, 62.0, 103.0, 142.0, 224.0, 396.0, 591.0, 934.0, 1430.0, 2275.0, 3580.0, 5696.0, 8737.0, 14381.0, 23140.0, 37981.0, 62203.0, 101931.0, 160419.0, 200519.0, 159791.0, 102333.0, 61977.0, 37818.0, 23093.0, 14194.0, 8944.0, 5656.0, 3613.0, 2317.0, 1441.0, 903.0, 614.0, 362.0, 233.0, 161.0, 100.0, 64.0, 30.0, 26.0, 12.0, 11.0, 8.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-19.046875, -18.42236328125, -17.7978515625, -17.17333984375, -16.548828125, -15.92431640625, -15.2998046875, -14.67529296875, -14.05078125, -13.42626953125, -12.8017578125, -12.17724609375, -11.552734375, -10.92822265625, -10.3037109375, -9.67919921875, -9.0546875, -8.43017578125, -7.8056640625, -7.18115234375, -6.556640625, -5.93212890625, -5.3076171875, -4.68310546875, -4.05859375, -3.43408203125, -2.8095703125, -2.18505859375, -1.560546875, -0.93603515625, -0.3115234375, 0.31298828125, 0.9375, 1.56201171875, 2.1865234375, 2.81103515625, 3.435546875, 4.06005859375, 4.6845703125, 5.30908203125, 5.93359375, 6.55810546875, 7.1826171875, 7.80712890625, 8.431640625, 9.05615234375, 9.6806640625, 10.30517578125, 10.9296875, 11.55419921875, 12.1787109375, 12.80322265625, 13.427734375, 14.05224609375, 14.6767578125, 15.30126953125, 15.92578125, 16.55029296875, 17.1748046875, 17.79931640625, 18.423828125, 19.04833984375, 19.6728515625, 20.29736328125, 20.921875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 8.0, 5.0, 7.0, 8.0, 12.0, 10.0, 25.0, 17.0, 24.0, 21.0, 36.0, 27.0, 16.0, 31.0, 35.0, 24.0, 36.0, 33.0, 36.0, 38.0, 40.0, 35.0, 33.0, 41.0, 39.0, 26.0, 35.0, 39.0, 31.0, 28.0, 21.0, 25.0, 11.0, 19.0, 18.0, 18.0, 18.0, 17.0, 8.0, 10.0, 2.0, 10.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.78125, -11.4019775390625, -11.022705078125, -10.6434326171875, -10.26416015625, -9.8848876953125, -9.505615234375, -9.1263427734375, -8.7470703125, -8.3677978515625, -7.988525390625, -7.6092529296875, -7.22998046875, -6.8507080078125, -6.471435546875, -6.0921630859375, -5.712890625, -5.3336181640625, -4.954345703125, -4.5750732421875, -4.19580078125, -3.8165283203125, -3.437255859375, -3.0579833984375, -2.6787109375, -2.2994384765625, -1.920166015625, -1.5408935546875, -1.16162109375, -0.7823486328125, -0.403076171875, -0.0238037109375, 0.35546875, 0.7347412109375, 1.114013671875, 1.4932861328125, 1.87255859375, 2.2518310546875, 2.631103515625, 3.0103759765625, 3.3896484375, 3.7689208984375, 4.148193359375, 4.5274658203125, 4.90673828125, 5.2860107421875, 5.665283203125, 6.0445556640625, 6.423828125, 6.8031005859375, 7.182373046875, 7.5616455078125, 7.94091796875, 8.3201904296875, 8.699462890625, 9.0787353515625, 9.4580078125, 9.8372802734375, 10.216552734375, 10.5958251953125, 10.97509765625, 11.3543701171875, 11.733642578125, 12.1129150390625, 12.4921875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 9.0, 13.0, 17.0, 34.0, 47.0, 77.0, 111.0, 150.0, 209.0, 335.0, 412.0, 616.0, 997.0, 1514.0, 2298.0, 3669.0, 5483.0, 8739.0, 14169.0, 22966.0, 38583.0, 65987.0, 118930.0, 216935.0, 232267.0, 132005.0, 72461.0, 42081.0, 25389.0, 15387.0, 9530.0, 6025.0, 3730.0, 2462.0, 1627.0, 999.0, 747.0, 469.0, 348.0, 222.0, 160.0, 104.0, 82.0, 47.0, 43.0, 21.0, 12.0, 6.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0], "bins": [-23.0, -22.3251953125, -21.650390625, -20.9755859375, -20.30078125, -19.6259765625, -18.951171875, -18.2763671875, -17.6015625, -16.9267578125, -16.251953125, -15.5771484375, -14.90234375, -14.2275390625, -13.552734375, -12.8779296875, -12.203125, -11.5283203125, -10.853515625, -10.1787109375, -9.50390625, -8.8291015625, -8.154296875, -7.4794921875, -6.8046875, -6.1298828125, -5.455078125, -4.7802734375, -4.10546875, -3.4306640625, -2.755859375, -2.0810546875, -1.40625, -0.7314453125, -0.056640625, 0.6181640625, 1.29296875, 1.9677734375, 2.642578125, 3.3173828125, 3.9921875, 4.6669921875, 5.341796875, 6.0166015625, 6.69140625, 7.3662109375, 8.041015625, 8.7158203125, 9.390625, 10.0654296875, 10.740234375, 11.4150390625, 12.08984375, 12.7646484375, 13.439453125, 14.1142578125, 14.7890625, 15.4638671875, 16.138671875, 16.8134765625, 17.48828125, 18.1630859375, 18.837890625, 19.5126953125, 20.1875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 10.0, 9.0, 11.0, 10.0, 15.0, 18.0, 26.0, 19.0, 13.0, 38.0, 35.0, 39.0, 40.0, 43.0, 36.0, 42.0, 50.0, 43.0, 49.0, 62.0, 51.0, 38.0, 36.0, 36.0, 39.0, 31.0, 29.0, 28.0, 21.0, 17.0, 8.0, 13.0, 5.0, 8.0, 4.0, 6.0, 0.0, 8.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.125, -11.7655029296875, -11.406005859375, -11.0465087890625, -10.68701171875, -10.3275146484375, -9.968017578125, -9.6085205078125, -9.2490234375, -8.8895263671875, -8.530029296875, -8.1705322265625, -7.81103515625, -7.4515380859375, -7.092041015625, -6.7325439453125, -6.373046875, -6.0135498046875, -5.654052734375, -5.2945556640625, -4.93505859375, -4.5755615234375, -4.216064453125, -3.8565673828125, -3.4970703125, -3.1375732421875, -2.778076171875, -2.4185791015625, -2.05908203125, -1.6995849609375, -1.340087890625, -0.9805908203125, -0.62109375, -0.2615966796875, 0.097900390625, 0.4573974609375, 0.81689453125, 1.1763916015625, 1.535888671875, 1.8953857421875, 2.2548828125, 2.6143798828125, 2.973876953125, 3.3333740234375, 3.69287109375, 4.0523681640625, 4.411865234375, 4.7713623046875, 5.130859375, 5.4903564453125, 5.849853515625, 6.2093505859375, 6.56884765625, 6.9283447265625, 7.287841796875, 7.6473388671875, 8.0068359375, 8.3663330078125, 8.725830078125, 9.0853271484375, 9.44482421875, 9.8043212890625, 10.163818359375, 10.5233154296875, 10.8828125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 4.0, 10.0, 10.0, 14.0, 15.0, 30.0, 46.0, 64.0, 121.0, 173.0, 237.0, 404.0, 706.0, 1385.0, 2780.0, 7491.0, 28530.0, 295667.0, 654674.0, 40089.0, 9224.0, 3354.0, 1512.0, 800.0, 401.0, 265.0, 165.0, 125.0, 89.0, 56.0, 35.0, 18.0, 17.0, 10.0, 12.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-129.0, -124.98046875, -120.9609375, -116.94140625, -112.921875, -108.90234375, -104.8828125, -100.86328125, -96.84375, -92.82421875, -88.8046875, -84.78515625, -80.765625, -76.74609375, -72.7265625, -68.70703125, -64.6875, -60.66796875, -56.6484375, -52.62890625, -48.609375, -44.58984375, -40.5703125, -36.55078125, -32.53125, -28.51171875, -24.4921875, -20.47265625, -16.453125, -12.43359375, -8.4140625, -4.39453125, -0.375, 3.64453125, 7.6640625, 11.68359375, 15.703125, 19.72265625, 23.7421875, 27.76171875, 31.78125, 35.80078125, 39.8203125, 43.83984375, 47.859375, 51.87890625, 55.8984375, 59.91796875, 63.9375, 67.95703125, 71.9765625, 75.99609375, 80.015625, 84.03515625, 88.0546875, 92.07421875, 96.09375, 100.11328125, 104.1328125, 108.15234375, 112.171875, 116.19140625, 120.2109375, 124.23046875, 128.25]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 3.0, 6.0, 11.0, 17.0, 26.0, 41.0, 66.0, 97.0, 132.0, 168.0, 150.0, 109.0, 66.0, 38.0, 26.0, 16.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022430419921875, -0.002161741256713867, -0.0020804405212402344, -0.0019991397857666016, -0.0019178390502929688, -0.001836538314819336, -0.0017552375793457031, -0.0016739368438720703, -0.0015926361083984375, -0.0015113353729248047, -0.0014300346374511719, -0.001348733901977539, -0.0012674331665039062, -0.0011861324310302734, -0.0011048316955566406, -0.0010235309600830078, -0.000942230224609375, -0.0008609294891357422, -0.0007796287536621094, -0.0006983280181884766, -0.0006170272827148438, -0.0005357265472412109, -0.0004544258117675781, -0.0003731250762939453, -0.0002918243408203125, -0.0002105236053466797, -0.00012922286987304688, -4.792213439941406e-05, 3.337860107421875e-05, 0.00011467933654785156, 0.00019598007202148438, 0.0002772808074951172, 0.00035858154296875, 0.0004398822784423828, 0.0005211830139160156, 0.0006024837493896484, 0.0006837844848632812, 0.0007650852203369141, 0.0008463859558105469, 0.0009276866912841797, 0.0010089874267578125, 0.0010902881622314453, 0.0011715888977050781, 0.001252889633178711, 0.0013341903686523438, 0.0014154911041259766, 0.0014967918395996094, 0.0015780925750732422, 0.001659393310546875, 0.0017406940460205078, 0.0018219947814941406, 0.0019032955169677734, 0.0019845962524414062, 0.002065896987915039, 0.002147197723388672, 0.0022284984588623047, 0.0023097991943359375, 0.0023910999298095703, 0.002472400665283203, 0.002553701400756836, 0.0026350021362304688, 0.0027163028717041016, 0.0027976036071777344, 0.002878904342651367, 0.002960205078125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 10.0, 6.0, 9.0, 6.0, 10.0, 21.0, 37.0, 29.0, 50.0, 73.0, 81.0, 119.0, 187.0, 278.0, 441.0, 637.0, 980.0, 1766.0, 3230.0, 7416.0, 21703.0, 117494.0, 771908.0, 89520.0, 18646.0, 6497.0, 2996.0, 1571.0, 966.0, 601.0, 366.0, 255.0, 194.0, 139.0, 107.0, 64.0, 34.0, 25.0, 22.0, 17.0, 5.0, 13.0, 9.0, 12.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-92.375, -89.4365234375, -86.498046875, -83.5595703125, -80.62109375, -77.6826171875, -74.744140625, -71.8056640625, -68.8671875, -65.9287109375, -62.990234375, -60.0517578125, -57.11328125, -54.1748046875, -51.236328125, -48.2978515625, -45.359375, -42.4208984375, -39.482421875, -36.5439453125, -33.60546875, -30.6669921875, -27.728515625, -24.7900390625, -21.8515625, -18.9130859375, -15.974609375, -13.0361328125, -10.09765625, -7.1591796875, -4.220703125, -1.2822265625, 1.65625, 4.5947265625, 7.533203125, 10.4716796875, 13.41015625, 16.3486328125, 19.287109375, 22.2255859375, 25.1640625, 28.1025390625, 31.041015625, 33.9794921875, 36.91796875, 39.8564453125, 42.794921875, 45.7333984375, 48.671875, 51.6103515625, 54.548828125, 57.4873046875, 60.42578125, 63.3642578125, 66.302734375, 69.2412109375, 72.1796875, 75.1181640625, 78.056640625, 80.9951171875, 83.93359375, 86.8720703125, 89.810546875, 92.7490234375, 95.6875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 9.0, 13.0, 24.0, 26.0, 54.0, 124.0, 171.0, 164.0, 146.0, 94.0, 65.0, 43.0, 19.0, 10.0, 9.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.203125, -24.425537109375, -23.64794921875, -22.870361328125, -22.0927734375, -21.315185546875, -20.53759765625, -19.760009765625, -18.982421875, -18.204833984375, -17.42724609375, -16.649658203125, -15.8720703125, -15.094482421875, -14.31689453125, -13.539306640625, -12.76171875, -11.984130859375, -11.20654296875, -10.428955078125, -9.6513671875, -8.873779296875, -8.09619140625, -7.318603515625, -6.541015625, -5.763427734375, -4.98583984375, -4.208251953125, -3.4306640625, -2.653076171875, -1.87548828125, -1.097900390625, -0.3203125, 0.457275390625, 1.23486328125, 2.012451171875, 2.7900390625, 3.567626953125, 4.34521484375, 5.122802734375, 5.900390625, 6.677978515625, 7.45556640625, 8.233154296875, 9.0107421875, 9.788330078125, 10.56591796875, 11.343505859375, 12.12109375, 12.898681640625, 13.67626953125, 14.453857421875, 15.2314453125, 16.009033203125, 16.78662109375, 17.564208984375, 18.341796875, 19.119384765625, 19.89697265625, 20.674560546875, 21.4521484375, 22.229736328125, 23.00732421875, 23.784912109375, 24.5625]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 13.0, 6.0, 16.0, 20.0, 38.0, 38.0, 83.0, 115.0, 130.0, 124.0, 93.0, 72.0, 43.0, 42.0, 39.0, 21.0, 23.0, 18.0, 12.0, 6.0, 15.0, 2.0, 6.0, 4.0, 1.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.554726600646973, -14.7244873046875, -13.894248962402344, -13.064009666442871, -12.233771324157715, -11.403532028198242, -10.573293685913086, -9.743054389953613, -8.91281509399414, -8.082575798034668, -7.252337455749512, -6.422098159790039, -5.591859817504883, -4.76162052154541, -3.9313817024230957, -3.1011428833007812, -2.270904541015625, -1.4406657218933105, -0.6104267835617065, 0.21981215476989746, 1.050050973892212, 1.8802900314331055, 2.71052885055542, 3.5407676696777344, 4.371006488800049, 5.201245307922363, 6.031484127044678, 6.861722946166992, 7.691962242126465, 8.522201538085938, 9.352439880371094, 10.18267822265625, 11.012918472290039, 11.843157768249512, 12.673396110534668, 13.50363540649414, 14.333873748779297, 15.16411304473877, 15.994352340698242, 16.8245906829834, 17.654829025268555, 18.48506736755371, 19.3153076171875, 20.145545959472656, 20.975784301757812, 21.80602264404297, 22.636262893676758, 23.466501235961914, 24.296741485595703, 25.12697982788086, 25.95722007751465, 26.787458419799805, 27.61769676208496, 28.44793701171875, 29.278175354003906, 30.108413696289062, 30.93865203857422, 31.768890380859375, 32.59912872314453, 33.42936706542969, 34.25960922241211, 35.089847564697266, 35.92008590698242, 36.75032424926758, 37.580562591552734]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 10.0, 5.0, 7.0, 10.0, 14.0, 13.0, 11.0, 21.0, 16.0, 15.0, 31.0, 26.0, 19.0, 24.0, 36.0, 26.0, 40.0, 27.0, 26.0, 41.0, 28.0, 49.0, 42.0, 38.0, 41.0, 40.0, 34.0, 24.0, 26.0, 24.0, 30.0, 34.0, 21.0, 14.0, 17.0, 23.0, 12.0, 13.0, 7.0, 11.0, 16.0, 8.0, 5.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-13.678143501281738, -13.238385200500488, -12.798625946044922, -12.358867645263672, -11.919109344482422, -11.479350090026855, -11.039591789245605, -10.599832534790039, -10.160074234008789, -9.720315933227539, -9.280556678771973, -8.840798377990723, -8.401039123535156, -7.961280822753906, -7.521522521972656, -7.081763744354248, -6.64200496673584, -6.202246189117432, -5.762487411499023, -5.322729110717773, -4.882970333099365, -4.443211555480957, -4.003453254699707, -3.563694477081299, -3.1239356994628906, -2.6841769218444824, -2.2444183826446533, -1.8046597242355347, -1.364901065826416, -0.9251422882080078, -0.4853837490081787, -0.04562520980834961, 0.394134521484375, 0.8338931798934937, 1.2736518383026123, 1.713410496711731, 2.1531691551208496, 2.592927932739258, 3.032686471939087, 3.472445011138916, 3.912203788757324, 4.351962566375732, 4.791721343994141, 5.231479644775391, 5.671238422393799, 6.110997200012207, 6.550755500793457, 6.990514278411865, 7.430273056030273, 7.870031833648682, 8.30979061126709, 8.74954891204834, 9.189308166503906, 9.629066467285156, 10.068824768066406, 10.508583068847656, 10.948342323303223, 11.388100624084473, 11.827859878540039, 12.267618179321289, 12.707376480102539, 13.147135734558105, 13.586894035339355, 14.026653289794922, 14.466411590576172]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 8.0, 9.0, 26.0, 27.0, 41.0, 73.0, 93.0, 162.0, 247.0, 396.0, 578.0, 867.0, 1397.0, 2375.0, 3764.0, 6365.0, 10829.0, 19148.0, 35911.0, 71432.0, 164541.0, 592940.0, 2120735.0, 794324.0, 196379.0, 81305.0, 39627.0, 20973.0, 11826.0, 6993.0, 4152.0, 2581.0, 1550.0, 945.0, 605.0, 371.0, 223.0, 145.0, 113.0, 71.0, 46.0, 33.0, 16.0, 9.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.59375, -22.8466796875, -22.099609375, -21.3525390625, -20.60546875, -19.8583984375, -19.111328125, -18.3642578125, -17.6171875, -16.8701171875, -16.123046875, -15.3759765625, -14.62890625, -13.8818359375, -13.134765625, -12.3876953125, -11.640625, -10.8935546875, -10.146484375, -9.3994140625, -8.65234375, -7.9052734375, -7.158203125, -6.4111328125, -5.6640625, -4.9169921875, -4.169921875, -3.4228515625, -2.67578125, -1.9287109375, -1.181640625, -0.4345703125, 0.3125, 1.0595703125, 1.806640625, 2.5537109375, 3.30078125, 4.0478515625, 4.794921875, 5.5419921875, 6.2890625, 7.0361328125, 7.783203125, 8.5302734375, 9.27734375, 10.0244140625, 10.771484375, 11.5185546875, 12.265625, 13.0126953125, 13.759765625, 14.5068359375, 15.25390625, 16.0009765625, 16.748046875, 17.4951171875, 18.2421875, 18.9892578125, 19.736328125, 20.4833984375, 21.23046875, 21.9775390625, 22.724609375, 23.4716796875, 24.21875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 12.0, 9.0, 9.0, 9.0, 10.0, 21.0, 27.0, 26.0, 13.0, 29.0, 23.0, 29.0, 38.0, 37.0, 34.0, 45.0, 36.0, 42.0, 36.0, 43.0, 52.0, 38.0, 45.0, 36.0, 37.0, 45.0, 29.0, 21.0, 15.0, 29.0, 16.0, 20.0, 17.0, 9.0, 13.0, 11.0, 7.0, 7.0, 9.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.4735107421875, -8.197021484375, -7.9205322265625, -7.64404296875, -7.3675537109375, -7.091064453125, -6.8145751953125, -6.5380859375, -6.2615966796875, -5.985107421875, -5.7086181640625, -5.43212890625, -5.1556396484375, -4.879150390625, -4.6026611328125, -4.326171875, -4.0496826171875, -3.773193359375, -3.4967041015625, -3.22021484375, -2.9437255859375, -2.667236328125, -2.3907470703125, -2.1142578125, -1.8377685546875, -1.561279296875, -1.2847900390625, -1.00830078125, -0.7318115234375, -0.455322265625, -0.1788330078125, 0.09765625, 0.3741455078125, 0.650634765625, 0.9271240234375, 1.20361328125, 1.4801025390625, 1.756591796875, 2.0330810546875, 2.3095703125, 2.5860595703125, 2.862548828125, 3.1390380859375, 3.41552734375, 3.6920166015625, 3.968505859375, 4.2449951171875, 4.521484375, 4.7979736328125, 5.074462890625, 5.3509521484375, 5.62744140625, 5.9039306640625, 6.180419921875, 6.4569091796875, 6.7333984375, 7.0098876953125, 7.286376953125, 7.5628662109375, 7.83935546875, 8.1158447265625, 8.392333984375, 8.6688232421875, 8.9453125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 13.0, 19.0, 35.0, 34.0, 49.0, 87.0, 131.0, 202.0, 299.0, 411.0, 627.0, 937.0, 1435.0, 2184.0, 3499.0, 5580.0, 9196.0, 15000.0, 27148.0, 51646.0, 108384.0, 268341.0, 888772.0, 1873522.0, 565122.0, 192756.0, 82611.0, 40302.0, 22057.0, 12740.0, 7759.0, 4674.0, 3075.0, 1899.0, 1273.0, 783.0, 513.0, 397.0, 245.0, 178.0, 128.0, 72.0, 33.0, 36.0, 26.0, 20.0, 9.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.21875, -17.63720703125, -17.0556640625, -16.47412109375, -15.892578125, -15.31103515625, -14.7294921875, -14.14794921875, -13.56640625, -12.98486328125, -12.4033203125, -11.82177734375, -11.240234375, -10.65869140625, -10.0771484375, -9.49560546875, -8.9140625, -8.33251953125, -7.7509765625, -7.16943359375, -6.587890625, -6.00634765625, -5.4248046875, -4.84326171875, -4.26171875, -3.68017578125, -3.0986328125, -2.51708984375, -1.935546875, -1.35400390625, -0.7724609375, -0.19091796875, 0.390625, 0.97216796875, 1.5537109375, 2.13525390625, 2.716796875, 3.29833984375, 3.8798828125, 4.46142578125, 5.04296875, 5.62451171875, 6.2060546875, 6.78759765625, 7.369140625, 7.95068359375, 8.5322265625, 9.11376953125, 9.6953125, 10.27685546875, 10.8583984375, 11.43994140625, 12.021484375, 12.60302734375, 13.1845703125, 13.76611328125, 14.34765625, 14.92919921875, 15.5107421875, 16.09228515625, 16.673828125, 17.25537109375, 17.8369140625, 18.41845703125, 19.0]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 5.0, 5.0, 7.0, 10.0, 14.0, 12.0, 20.0, 19.0, 29.0, 30.0, 48.0, 60.0, 75.0, 85.0, 82.0, 126.0, 181.0, 204.0, 252.0, 314.0, 345.0, 377.0, 319.0, 291.0, 234.0, 178.0, 140.0, 110.0, 78.0, 74.0, 64.0, 51.0, 51.0, 38.0, 27.0, 29.0, 20.0, 15.0, 12.0, 8.0, 9.0, 11.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.03125, -4.87640380859375, -4.7215576171875, -4.56671142578125, -4.411865234375, -4.25701904296875, -4.1021728515625, -3.94732666015625, -3.79248046875, -3.63763427734375, -3.4827880859375, -3.32794189453125, -3.173095703125, -3.01824951171875, -2.8634033203125, -2.70855712890625, -2.5537109375, -2.39886474609375, -2.2440185546875, -2.08917236328125, -1.934326171875, -1.77947998046875, -1.6246337890625, -1.46978759765625, -1.31494140625, -1.16009521484375, -1.0052490234375, -0.85040283203125, -0.695556640625, -0.54071044921875, -0.3858642578125, -0.23101806640625, -0.076171875, 0.07867431640625, 0.2335205078125, 0.38836669921875, 0.543212890625, 0.69805908203125, 0.8529052734375, 1.00775146484375, 1.16259765625, 1.31744384765625, 1.4722900390625, 1.62713623046875, 1.781982421875, 1.93682861328125, 2.0916748046875, 2.24652099609375, 2.4013671875, 2.55621337890625, 2.7110595703125, 2.86590576171875, 3.020751953125, 3.17559814453125, 3.3304443359375, 3.48529052734375, 3.64013671875, 3.79498291015625, 3.9498291015625, 4.10467529296875, 4.259521484375, 4.41436767578125, 4.5692138671875, 4.72406005859375, 4.87890625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 9.0, 9.0, 9.0, 20.0, 30.0, 32.0, 74.0, 99.0, 143.0, 139.0, 131.0, 78.0, 52.0, 38.0, 33.0, 19.0, 13.0, 12.0, 13.0, 8.0, 6.0, 2.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.20258331298828, -15.572851181030273, -14.943119049072266, -14.313386917114258, -13.68365478515625, -13.053922653198242, -12.424189567565918, -11.79445743560791, -11.164725303649902, -10.534993171691895, -9.905261039733887, -9.275528907775879, -8.645795822143555, -8.016063690185547, -7.386331558227539, -6.756599426269531, -6.126867294311523, -5.497135162353516, -4.867403030395508, -4.237670421600342, -3.607938289642334, -2.978206157684326, -2.3484737873077393, -1.7187414169311523, -1.0890092849731445, -0.45927703380584717, 0.1704552173614502, 0.8001874685287476, 1.429919719696045, 2.0596518516540527, 2.6893842220306396, 3.3191165924072266, 3.9488487243652344, 4.578580856323242, 5.20831298828125, 5.838045597076416, 6.467777729034424, 7.097509860992432, 7.727242469787598, 8.356974601745605, 8.986706733703613, 9.616438865661621, 10.246170997619629, 10.875903129577637, 11.505636215209961, 12.135368347167969, 12.765100479125977, 13.394832611083984, 14.024564743041992, 14.654296875, 15.284029006958008, 15.913761138916016, 16.543493270874023, 17.17322540283203, 17.80295753479004, 18.432689666748047, 19.062423706054688, 19.692155838012695, 20.321887969970703, 20.95162010192871, 21.58135223388672, 22.211084365844727, 22.840816497802734, 23.470550537109375, 24.10028076171875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 7.0, 1.0, 6.0, 8.0, 10.0, 9.0, 11.0, 16.0, 23.0, 16.0, 20.0, 27.0, 31.0, 27.0, 34.0, 36.0, 52.0, 41.0, 40.0, 46.0, 49.0, 41.0, 43.0, 39.0, 37.0, 42.0, 36.0, 30.0, 37.0, 31.0, 25.0, 27.0, 16.0, 20.0, 10.0, 12.0, 11.0, 11.0, 7.0, 1.0, 4.0, 7.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.268240928649902, -9.914152145385742, -9.560063362121582, -9.205974578857422, -8.851885795593262, -8.497797012329102, -8.143707275390625, -7.789618968963623, -7.435530185699463, -7.081441402435303, -6.727352619171143, -6.373263359069824, -6.019174575805664, -5.665085792541504, -5.310997009277344, -4.956908226013184, -4.602819442749023, -4.248730659484863, -3.894641876220703, -3.540552854537964, -3.1864640712738037, -2.8323752880096436, -2.4782862663269043, -2.124197483062744, -1.770108699798584, -1.4160199165344238, -1.0619310140609741, -0.7078421115875244, -0.35375332832336426, 0.00033545494079589844, 0.35442447662353516, 0.7085132598876953, 1.062601089477539, 1.4166898727416992, 1.770778775215149, 2.1248676776885986, 2.478956460952759, 2.833045244216919, 3.187134265899658, 3.5412230491638184, 3.8953118324279785, 4.249400615692139, 4.603489398956299, 4.957578659057617, 5.311667442321777, 5.6657562255859375, 6.019845008850098, 6.373933792114258, 6.728022575378418, 7.082111358642578, 7.436200141906738, 7.790288925170898, 8.144377708435059, 8.498466491699219, 8.852556228637695, 9.206644058227539, 9.560733795166016, 9.914822578430176, 10.268911361694336, 10.623000144958496, 10.977088928222656, 11.331177711486816, 11.685266494750977, 12.039356231689453, 12.393444061279297]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 11.0, 25.0, 27.0, 45.0, 69.0, 101.0, 140.0, 208.0, 277.0, 449.0, 699.0, 1000.0, 1551.0, 2388.0, 3850.0, 6144.0, 10077.0, 17290.0, 30621.0, 59347.0, 125551.0, 290870.0, 260976.0, 113340.0, 54210.0, 28319.0, 15925.0, 9436.0, 5652.0, 3391.0, 2230.0, 1471.0, 962.0, 628.0, 398.0, 288.0, 176.0, 126.0, 74.0, 63.0, 38.0, 33.0, 25.0, 21.0, 8.0, 3.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5859375, -8.308349609375, -8.03076171875, -7.753173828125, -7.4755859375, -7.197998046875, -6.92041015625, -6.642822265625, -6.365234375, -6.087646484375, -5.81005859375, -5.532470703125, -5.2548828125, -4.977294921875, -4.69970703125, -4.422119140625, -4.14453125, -3.866943359375, -3.58935546875, -3.311767578125, -3.0341796875, -2.756591796875, -2.47900390625, -2.201416015625, -1.923828125, -1.646240234375, -1.36865234375, -1.091064453125, -0.8134765625, -0.535888671875, -0.25830078125, 0.019287109375, 0.296875, 0.574462890625, 0.85205078125, 1.129638671875, 1.4072265625, 1.684814453125, 1.96240234375, 2.239990234375, 2.517578125, 2.795166015625, 3.07275390625, 3.350341796875, 3.6279296875, 3.905517578125, 4.18310546875, 4.460693359375, 4.73828125, 5.015869140625, 5.29345703125, 5.571044921875, 5.8486328125, 6.126220703125, 6.40380859375, 6.681396484375, 6.958984375, 7.236572265625, 7.51416015625, 7.791748046875, 8.0693359375, 8.346923828125, 8.62451171875, 8.902099609375, 9.1796875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 11.0, 13.0, 8.0, 8.0, 14.0, 15.0, 19.0, 27.0, 27.0, 18.0, 24.0, 34.0, 36.0, 41.0, 55.0, 36.0, 44.0, 49.0, 52.0, 45.0, 43.0, 45.0, 35.0, 49.0, 29.0, 28.0, 29.0, 29.0, 24.0, 21.0, 13.0, 12.0, 13.0, 10.0, 12.0, 4.0, 9.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7109375, -9.35498046875, -8.9990234375, -8.64306640625, -8.287109375, -7.93115234375, -7.5751953125, -7.21923828125, -6.86328125, -6.50732421875, -6.1513671875, -5.79541015625, -5.439453125, -5.08349609375, -4.7275390625, -4.37158203125, -4.015625, -3.65966796875, -3.3037109375, -2.94775390625, -2.591796875, -2.23583984375, -1.8798828125, -1.52392578125, -1.16796875, -0.81201171875, -0.4560546875, -0.10009765625, 0.255859375, 0.61181640625, 0.9677734375, 1.32373046875, 1.6796875, 2.03564453125, 2.3916015625, 2.74755859375, 3.103515625, 3.45947265625, 3.8154296875, 4.17138671875, 4.52734375, 4.88330078125, 5.2392578125, 5.59521484375, 5.951171875, 6.30712890625, 6.6630859375, 7.01904296875, 7.375, 7.73095703125, 8.0869140625, 8.44287109375, 8.798828125, 9.15478515625, 9.5107421875, 9.86669921875, 10.22265625, 10.57861328125, 10.9345703125, 11.29052734375, 11.646484375, 12.00244140625, 12.3583984375, 12.71435546875, 13.0703125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 7.0, 13.0, 11.0, 15.0, 23.0, 38.0, 50.0, 77.0, 106.0, 168.0, 268.0, 363.0, 522.0, 827.0, 1333.0, 2014.0, 3184.0, 5352.0, 10111.0, 20766.0, 53036.0, 192177.0, 542074.0, 135745.0, 41918.0, 17054.0, 8369.0, 4750.0, 2822.0, 1830.0, 1194.0, 777.0, 524.0, 317.0, 219.0, 161.0, 102.0, 79.0, 50.0, 25.0, 24.0, 15.0, 16.0, 14.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-13.765625, -13.353271484375, -12.94091796875, -12.528564453125, -12.1162109375, -11.703857421875, -11.29150390625, -10.879150390625, -10.466796875, -10.054443359375, -9.64208984375, -9.229736328125, -8.8173828125, -8.405029296875, -7.99267578125, -7.580322265625, -7.16796875, -6.755615234375, -6.34326171875, -5.930908203125, -5.5185546875, -5.106201171875, -4.69384765625, -4.281494140625, -3.869140625, -3.456787109375, -3.04443359375, -2.632080078125, -2.2197265625, -1.807373046875, -1.39501953125, -0.982666015625, -0.5703125, -0.157958984375, 0.25439453125, 0.666748046875, 1.0791015625, 1.491455078125, 1.90380859375, 2.316162109375, 2.728515625, 3.140869140625, 3.55322265625, 3.965576171875, 4.3779296875, 4.790283203125, 5.20263671875, 5.614990234375, 6.02734375, 6.439697265625, 6.85205078125, 7.264404296875, 7.6767578125, 8.089111328125, 8.50146484375, 8.913818359375, 9.326171875, 9.738525390625, 10.15087890625, 10.563232421875, 10.9755859375, 11.387939453125, 11.80029296875, 12.212646484375, 12.625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 7.0, 6.0, 13.0, 14.0, 14.0, 17.0, 15.0, 25.0, 27.0, 27.0, 36.0, 49.0, 40.0, 38.0, 38.0, 33.0, 49.0, 54.0, 44.0, 49.0, 37.0, 47.0, 40.0, 45.0, 36.0, 35.0, 24.0, 22.0, 22.0, 19.0, 10.0, 14.0, 12.0, 15.0, 7.0, 4.0, 6.0, 8.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -8.031494140625, -7.77392578125, -7.516357421875, -7.2587890625, -7.001220703125, -6.74365234375, -6.486083984375, -6.228515625, -5.970947265625, -5.71337890625, -5.455810546875, -5.1982421875, -4.940673828125, -4.68310546875, -4.425537109375, -4.16796875, -3.910400390625, -3.65283203125, -3.395263671875, -3.1376953125, -2.880126953125, -2.62255859375, -2.364990234375, -2.107421875, -1.849853515625, -1.59228515625, -1.334716796875, -1.0771484375, -0.819580078125, -0.56201171875, -0.304443359375, -0.046875, 0.210693359375, 0.46826171875, 0.725830078125, 0.9833984375, 1.240966796875, 1.49853515625, 1.756103515625, 2.013671875, 2.271240234375, 2.52880859375, 2.786376953125, 3.0439453125, 3.301513671875, 3.55908203125, 3.816650390625, 4.07421875, 4.331787109375, 4.58935546875, 4.846923828125, 5.1044921875, 5.362060546875, 5.61962890625, 5.877197265625, 6.134765625, 6.392333984375, 6.64990234375, 6.907470703125, 7.1650390625, 7.422607421875, 7.68017578125, 7.937744140625, 8.1953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 7.0, 15.0, 16.0, 17.0, 28.0, 36.0, 53.0, 63.0, 103.0, 161.0, 236.0, 372.0, 542.0, 862.0, 1380.0, 2488.0, 4432.0, 8693.0, 20382.0, 65845.0, 606179.0, 260245.0, 44500.0, 15497.0, 7169.0, 3662.0, 2158.0, 1181.0, 724.0, 481.0, 314.0, 226.0, 155.0, 100.0, 76.0, 35.0, 37.0, 27.0, 12.0, 16.0, 11.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.431640625, -2.350189208984375, -2.26873779296875, -2.187286376953125, -2.1058349609375, -2.024383544921875, -1.94293212890625, -1.861480712890625, -1.780029296875, -1.698577880859375, -1.61712646484375, -1.535675048828125, -1.4542236328125, -1.372772216796875, -1.29132080078125, -1.209869384765625, -1.12841796875, -1.046966552734375, -0.96551513671875, -0.884063720703125, -0.8026123046875, -0.721160888671875, -0.63970947265625, -0.558258056640625, -0.476806640625, -0.395355224609375, -0.31390380859375, -0.232452392578125, -0.1510009765625, -0.069549560546875, 0.01190185546875, 0.093353271484375, 0.1748046875, 0.256256103515625, 0.33770751953125, 0.419158935546875, 0.5006103515625, 0.582061767578125, 0.66351318359375, 0.744964599609375, 0.826416015625, 0.907867431640625, 0.98931884765625, 1.070770263671875, 1.1522216796875, 1.233673095703125, 1.31512451171875, 1.396575927734375, 1.47802734375, 1.559478759765625, 1.64093017578125, 1.722381591796875, 1.8038330078125, 1.885284423828125, 1.96673583984375, 2.048187255859375, 2.129638671875, 2.211090087890625, 2.29254150390625, 2.373992919921875, 2.4554443359375, 2.536895751953125, 2.61834716796875, 2.699798583984375, 2.78125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 14.0, 23.0, 33.0, 57.0, 71.0, 111.0, 171.0, 167.0, 102.0, 75.0, 50.0, 32.0, 31.0, 15.0, 12.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.00028896331787109375, -0.0002825409173965454, -0.00027611851692199707, -0.00026969611644744873, -0.0002632737159729004, -0.00025685131549835205, -0.0002504289150238037, -0.00024400651454925537, -0.00023758411407470703, -0.0002311617136001587, -0.00022473931312561035, -0.000218316912651062, -0.00021189451217651367, -0.00020547211170196533, -0.000199049711227417, -0.00019262731075286865, -0.0001862049102783203, -0.00017978250980377197, -0.00017336010932922363, -0.0001669377088546753, -0.00016051530838012695, -0.0001540929079055786, -0.00014767050743103027, -0.00014124810695648193, -0.0001348257064819336, -0.00012840330600738525, -0.00012198090553283691, -0.00011555850505828857, -0.00010913610458374023, -0.0001027137041091919, -9.629130363464355e-05, -8.986890316009521e-05, -8.344650268554688e-05, -7.702410221099854e-05, -7.06017017364502e-05, -6.417930126190186e-05, -5.7756900787353516e-05, -5.1334500312805176e-05, -4.4912099838256836e-05, -3.8489699363708496e-05, -3.2067298889160156e-05, -2.5644898414611816e-05, -1.9222497940063477e-05, -1.2800097465515137e-05, -6.377696990966797e-06, 4.470348358154297e-08, 6.467103958129883e-06, 1.2889504432678223e-05, 1.9311904907226562e-05, 2.5734305381774902e-05, 3.215670585632324e-05, 3.857910633087158e-05, 4.500150680541992e-05, 5.142390727996826e-05, 5.78463077545166e-05, 6.426870822906494e-05, 7.069110870361328e-05, 7.711350917816162e-05, 8.353590965270996e-05, 8.99583101272583e-05, 9.638071060180664e-05, 0.00010280311107635498, 0.00010922551155090332, 0.00011564791202545166, 0.0001220703125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 4.0, 13.0, 10.0, 13.0, 23.0, 24.0, 32.0, 67.0, 74.0, 100.0, 145.0, 205.0, 275.0, 483.0, 607.0, 920.0, 1374.0, 2021.0, 3171.0, 4918.0, 7838.0, 13622.0, 24372.0, 50691.0, 138656.0, 549692.0, 138291.0, 50534.0, 24567.0, 13443.0, 7934.0, 4893.0, 3098.0, 2037.0, 1384.0, 936.0, 620.0, 437.0, 281.0, 223.0, 148.0, 108.0, 71.0, 53.0, 36.0, 25.0, 23.0, 12.0, 14.0, 14.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-3.619140625, -3.504241943359375, -3.38934326171875, -3.274444580078125, -3.1595458984375, -3.044647216796875, -2.92974853515625, -2.814849853515625, -2.699951171875, -2.585052490234375, -2.47015380859375, -2.355255126953125, -2.2403564453125, -2.125457763671875, -2.01055908203125, -1.895660400390625, -1.78076171875, -1.665863037109375, -1.55096435546875, -1.436065673828125, -1.3211669921875, -1.206268310546875, -1.09136962890625, -0.976470947265625, -0.861572265625, -0.746673583984375, -0.63177490234375, -0.516876220703125, -0.4019775390625, -0.287078857421875, -0.17218017578125, -0.057281494140625, 0.0576171875, 0.172515869140625, 0.28741455078125, 0.402313232421875, 0.5172119140625, 0.632110595703125, 0.74700927734375, 0.861907958984375, 0.976806640625, 1.091705322265625, 1.20660400390625, 1.321502685546875, 1.4364013671875, 1.551300048828125, 1.66619873046875, 1.781097412109375, 1.89599609375, 2.010894775390625, 2.12579345703125, 2.240692138671875, 2.3555908203125, 2.470489501953125, 2.58538818359375, 2.700286865234375, 2.815185546875, 2.930084228515625, 3.04498291015625, 3.159881591796875, 3.2747802734375, 3.389678955078125, 3.50457763671875, 3.619476318359375, 3.734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 8.0, 16.0, 13.0, 18.0, 12.0, 20.0, 23.0, 38.0, 37.0, 43.0, 57.0, 81.0, 130.0, 102.0, 81.0, 58.0, 36.0, 35.0, 27.0, 25.0, 26.0, 18.0, 13.0, 15.0, 10.0, 13.0, 5.0, 9.0, 1.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0654296875, -1.0308990478515625, -0.996368408203125, -0.9618377685546875, -0.92730712890625, -0.8927764892578125, -0.858245849609375, -0.8237152099609375, -0.7891845703125, -0.7546539306640625, -0.720123291015625, -0.6855926513671875, -0.65106201171875, -0.6165313720703125, -0.582000732421875, -0.5474700927734375, -0.512939453125, -0.4784088134765625, -0.443878173828125, -0.4093475341796875, -0.37481689453125, -0.3402862548828125, -0.305755615234375, -0.2712249755859375, -0.2366943359375, -0.2021636962890625, -0.167633056640625, -0.1331024169921875, -0.09857177734375, -0.0640411376953125, -0.029510498046875, 0.0050201416015625, 0.03955078125, 0.0740814208984375, 0.108612060546875, 0.1431427001953125, 0.17767333984375, 0.2122039794921875, 0.246734619140625, 0.2812652587890625, 0.3157958984375, 0.3503265380859375, 0.384857177734375, 0.4193878173828125, 0.45391845703125, 0.4884490966796875, 0.522979736328125, 0.5575103759765625, 0.592041015625, 0.6265716552734375, 0.661102294921875, 0.6956329345703125, 0.73016357421875, 0.7646942138671875, 0.799224853515625, 0.8337554931640625, 0.8682861328125, 0.9028167724609375, 0.937347412109375, 0.9718780517578125, 1.00640869140625, 1.0409393310546875, 1.075469970703125, 1.1100006103515625, 1.14453125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 5.0, 7.0, 5.0, 14.0, 11.0, 14.0, 31.0, 41.0, 53.0, 86.0, 121.0, 157.0, 119.0, 87.0, 52.0, 41.0, 39.0, 26.0, 13.0, 9.0, 10.0, 12.0, 10.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.956852912902832, -13.393542289733887, -12.830231666564941, -12.266921043395996, -11.703609466552734, -11.140298843383789, -10.576988220214844, -10.013677597045898, -9.450366973876953, -8.887056350708008, -8.323745727539062, -7.760434627532959, -7.197124004364014, -6.633813381195068, -6.070502281188965, -5.5071916580200195, -4.943881034851074, -4.380570411682129, -3.8172595500946045, -3.25394868850708, -2.6906380653381348, -2.1273274421691895, -1.564016580581665, -1.0007057189941406, -0.4373950958251953, 0.12591564655303955, 0.6892263889312744, 1.2525371313095093, 1.8158478736877441, 2.3791584968566895, 2.942469358444214, 3.5057802200317383, 4.069091796875, 4.632402420043945, 5.195713043212891, 5.759024143218994, 6.3223347663879395, 6.885645389556885, 7.448956489562988, 8.012267112731934, 8.575577735900879, 9.138888359069824, 9.70219898223877, 10.265509605407715, 10.828821182250977, 11.392131805419922, 11.955442428588867, 12.518753051757812, 13.082063674926758, 13.645374298095703, 14.208684921264648, 14.771995544433594, 15.335306167602539, 15.898616790771484, 16.46192741394043, 17.025238037109375, 17.588550567626953, 18.1518611907959, 18.715171813964844, 19.27848243713379, 19.841793060302734, 20.40510368347168, 20.968414306640625, 21.531726837158203, 22.095035552978516]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 1.0, 6.0, 8.0, 11.0, 15.0, 11.0, 13.0, 13.0, 26.0, 21.0, 20.0, 38.0, 24.0, 36.0, 33.0, 49.0, 39.0, 42.0, 48.0, 45.0, 34.0, 43.0, 56.0, 40.0, 32.0, 40.0, 30.0, 26.0, 32.0, 32.0, 17.0, 14.0, 22.0, 15.0, 14.0, 6.0, 14.0, 11.0, 5.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.061328887939453, -9.713666915893555, -9.366004943847656, -9.018342971801758, -8.670681953430176, -8.323019981384277, -7.975358009338379, -7.6276960372924805, -7.280034065246582, -6.932372093200684, -6.584710597991943, -6.237048625946045, -5.8893866539001465, -5.541725158691406, -5.194063186645508, -4.846401214599609, -4.498739719390869, -4.151077747344971, -3.8034160137176514, -3.455754280090332, -3.1080923080444336, -2.7604305744171143, -2.412768840789795, -2.0651068687438965, -1.7174451351165771, -1.3697832822799683, -1.0221214294433594, -0.67445969581604, -0.32679784297943115, 0.020864009857177734, 0.36852574348449707, 0.7161877155303955, 1.0638494491577148, 1.4115113019943237, 1.7591731548309326, 2.106834888458252, 2.4544968605041504, 2.8021585941314697, 3.149820327758789, 3.4974822998046875, 3.845144033432007, 4.192805767059326, 4.540467739105225, 4.888129234313965, 5.235791206359863, 5.583453178405762, 5.93111515045166, 6.278777122497559, 6.626438617706299, 6.974100589752197, 7.3217620849609375, 7.669424057006836, 8.017086029052734, 8.364748001098633, 8.712409973144531, 9.06007194519043, 9.407732963562012, 9.75539493560791, 10.103056907653809, 10.45071792602539, 10.798379898071289, 11.146041870117188, 11.493703842163086, 11.841365814208984, 12.189027786254883]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 16.0, 18.0, 25.0, 30.0, 62.0, 69.0, 87.0, 134.0, 186.0, 288.0, 487.0, 659.0, 944.0, 1424.0, 2324.0, 3483.0, 5480.0, 8776.0, 14696.0, 24420.0, 41237.0, 72188.0, 127290.0, 207810.0, 214521.0, 134540.0, 76781.0, 43591.0, 25850.0, 15458.0, 9367.0, 5676.0, 3679.0, 2309.0, 1504.0, 1038.0, 676.0, 465.0, 318.0, 207.0, 126.0, 101.0, 59.0, 54.0, 28.0, 20.0, 15.0, 11.0, 11.0, 5.0, 6.0, 2.0, 0.0, 4.0, 0.0, 1.0], "bins": [-14.5234375, -14.0703125, -13.6171875, -13.1640625, -12.7109375, -12.2578125, -11.8046875, -11.3515625, -10.8984375, -10.4453125, -9.9921875, -9.5390625, -9.0859375, -8.6328125, -8.1796875, -7.7265625, -7.2734375, -6.8203125, -6.3671875, -5.9140625, -5.4609375, -5.0078125, -4.5546875, -4.1015625, -3.6484375, -3.1953125, -2.7421875, -2.2890625, -1.8359375, -1.3828125, -0.9296875, -0.4765625, -0.0234375, 0.4296875, 0.8828125, 1.3359375, 1.7890625, 2.2421875, 2.6953125, 3.1484375, 3.6015625, 4.0546875, 4.5078125, 4.9609375, 5.4140625, 5.8671875, 6.3203125, 6.7734375, 7.2265625, 7.6796875, 8.1328125, 8.5859375, 9.0390625, 9.4921875, 9.9453125, 10.3984375, 10.8515625, 11.3046875, 11.7578125, 12.2109375, 12.6640625, 13.1171875, 13.5703125, 14.0234375, 14.4765625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 13.0, 16.0, 7.0, 14.0, 12.0, 19.0, 20.0, 23.0, 28.0, 31.0, 40.0, 32.0, 41.0, 52.0, 47.0, 44.0, 42.0, 38.0, 43.0, 44.0, 48.0, 31.0, 45.0, 28.0, 32.0, 31.0, 23.0, 16.0, 29.0, 12.0, 14.0, 15.0, 22.0, 7.0, 8.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.796875, -9.4822998046875, -9.167724609375, -8.8531494140625, -8.53857421875, -8.2239990234375, -7.909423828125, -7.5948486328125, -7.2802734375, -6.9656982421875, -6.651123046875, -6.3365478515625, -6.02197265625, -5.7073974609375, -5.392822265625, -5.0782470703125, -4.763671875, -4.4490966796875, -4.134521484375, -3.8199462890625, -3.50537109375, -3.1907958984375, -2.876220703125, -2.5616455078125, -2.2470703125, -1.9324951171875, -1.617919921875, -1.3033447265625, -0.98876953125, -0.6741943359375, -0.359619140625, -0.0450439453125, 0.26953125, 0.5841064453125, 0.898681640625, 1.2132568359375, 1.52783203125, 1.8424072265625, 2.156982421875, 2.4715576171875, 2.7861328125, 3.1007080078125, 3.415283203125, 3.7298583984375, 4.04443359375, 4.3590087890625, 4.673583984375, 4.9881591796875, 5.302734375, 5.6173095703125, 5.931884765625, 6.2464599609375, 6.56103515625, 6.8756103515625, 7.190185546875, 7.5047607421875, 7.8193359375, 8.1339111328125, 8.448486328125, 8.7630615234375, 9.07763671875, 9.3922119140625, 9.706787109375, 10.0213623046875, 10.3359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 13.0, 26.0, 21.0, 32.0, 49.0, 74.0, 90.0, 160.0, 270.0, 338.0, 511.0, 858.0, 1338.0, 2125.0, 3511.0, 5902.0, 9810.0, 17316.0, 31808.0, 59479.0, 116760.0, 243690.0, 271760.0, 133180.0, 66695.0, 35460.0, 19589.0, 11086.0, 6165.0, 3822.0, 2476.0, 1452.0, 953.0, 591.0, 397.0, 262.0, 155.0, 98.0, 71.0, 54.0, 26.0, 19.0, 14.0, 14.0, 8.0, 7.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.484375, -17.92578125, -17.3671875, -16.80859375, -16.25, -15.69140625, -15.1328125, -14.57421875, -14.015625, -13.45703125, -12.8984375, -12.33984375, -11.78125, -11.22265625, -10.6640625, -10.10546875, -9.546875, -8.98828125, -8.4296875, -7.87109375, -7.3125, -6.75390625, -6.1953125, -5.63671875, -5.078125, -4.51953125, -3.9609375, -3.40234375, -2.84375, -2.28515625, -1.7265625, -1.16796875, -0.609375, -0.05078125, 0.5078125, 1.06640625, 1.625, 2.18359375, 2.7421875, 3.30078125, 3.859375, 4.41796875, 4.9765625, 5.53515625, 6.09375, 6.65234375, 7.2109375, 7.76953125, 8.328125, 8.88671875, 9.4453125, 10.00390625, 10.5625, 11.12109375, 11.6796875, 12.23828125, 12.796875, 13.35546875, 13.9140625, 14.47265625, 15.03125, 15.58984375, 16.1484375, 16.70703125, 17.265625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 9.0, 10.0, 9.0, 5.0, 6.0, 17.0, 16.0, 13.0, 34.0, 18.0, 21.0, 18.0, 32.0, 36.0, 41.0, 42.0, 25.0, 25.0, 44.0, 37.0, 40.0, 41.0, 52.0, 38.0, 25.0, 40.0, 30.0, 39.0, 30.0, 39.0, 22.0, 19.0, 20.0, 11.0, 26.0, 11.0, 9.0, 16.0, 8.0, 11.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.7421875, -6.52178955078125, -6.3013916015625, -6.08099365234375, -5.860595703125, -5.64019775390625, -5.4197998046875, -5.19940185546875, -4.97900390625, -4.75860595703125, -4.5382080078125, -4.31781005859375, -4.097412109375, -3.87701416015625, -3.6566162109375, -3.43621826171875, -3.2158203125, -2.99542236328125, -2.7750244140625, -2.55462646484375, -2.334228515625, -2.11383056640625, -1.8934326171875, -1.67303466796875, -1.45263671875, -1.23223876953125, -1.0118408203125, -0.79144287109375, -0.571044921875, -0.35064697265625, -0.1302490234375, 0.09014892578125, 0.310546875, 0.53094482421875, 0.7513427734375, 0.97174072265625, 1.192138671875, 1.41253662109375, 1.6329345703125, 1.85333251953125, 2.07373046875, 2.29412841796875, 2.5145263671875, 2.73492431640625, 2.955322265625, 3.17572021484375, 3.3961181640625, 3.61651611328125, 3.8369140625, 4.05731201171875, 4.2777099609375, 4.49810791015625, 4.718505859375, 4.93890380859375, 5.1593017578125, 5.37969970703125, 5.60009765625, 5.82049560546875, 6.0408935546875, 6.26129150390625, 6.481689453125, 6.70208740234375, 6.9224853515625, 7.14288330078125, 7.36328125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 11.0, 9.0, 14.0, 20.0, 46.0, 51.0, 67.0, 130.0, 173.0, 254.0, 376.0, 562.0, 897.0, 1367.0, 2272.0, 3608.0, 6521.0, 12841.0, 28579.0, 78993.0, 590001.0, 219710.0, 56047.0, 21802.0, 10160.0, 5531.0, 3137.0, 1859.0, 1199.0, 769.0, 518.0, 333.0, 216.0, 148.0, 103.0, 62.0, 55.0, 38.0, 16.0, 19.0, 10.0, 9.0, 7.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.890625, -30.856689453125, -29.82275390625, -28.788818359375, -27.7548828125, -26.720947265625, -25.68701171875, -24.653076171875, -23.619140625, -22.585205078125, -21.55126953125, -20.517333984375, -19.4833984375, -18.449462890625, -17.41552734375, -16.381591796875, -15.34765625, -14.313720703125, -13.27978515625, -12.245849609375, -11.2119140625, -10.177978515625, -9.14404296875, -8.110107421875, -7.076171875, -6.042236328125, -5.00830078125, -3.974365234375, -2.9404296875, -1.906494140625, -0.87255859375, 0.161376953125, 1.1953125, 2.229248046875, 3.26318359375, 4.297119140625, 5.3310546875, 6.364990234375, 7.39892578125, 8.432861328125, 9.466796875, 10.500732421875, 11.53466796875, 12.568603515625, 13.6025390625, 14.636474609375, 15.67041015625, 16.704345703125, 17.73828125, 18.772216796875, 19.80615234375, 20.840087890625, 21.8740234375, 22.907958984375, 23.94189453125, 24.975830078125, 26.009765625, 27.043701171875, 28.07763671875, 29.111572265625, 30.1455078125, 31.179443359375, 32.21337890625, 33.247314453125, 34.28125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 6.0, 8.0, 8.0, 10.0, 16.0, 31.0, 49.0, 46.0, 45.0, 84.0, 155.0, 188.0, 80.0, 77.0, 43.0, 48.0, 29.0, 20.0, 14.0, 13.0, 6.0, 3.0, 4.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010814666748046875, -0.001049727201461792, -0.0010179877281188965, -0.000986248254776001, -0.0009545087814331055, -0.00092276930809021, -0.0008910298347473145, -0.0008592903614044189, -0.0008275508880615234, -0.0007958114147186279, -0.0007640719413757324, -0.0007323324680328369, -0.0007005929946899414, -0.0006688535213470459, -0.0006371140480041504, -0.0006053745746612549, -0.0005736351013183594, -0.0005418956279754639, -0.0005101561546325684, -0.00047841668128967285, -0.00044667720794677734, -0.00041493773460388184, -0.00038319826126098633, -0.0003514587879180908, -0.0003197193145751953, -0.0002879798412322998, -0.0002562403678894043, -0.0002245008945465088, -0.00019276142120361328, -0.00016102194786071777, -0.00012928247451782227, -9.754300117492676e-05, -6.580352783203125e-05, -3.406405448913574e-05, -2.3245811462402344e-06, 2.9414892196655273e-05, 6.115436553955078e-05, 9.289383888244629e-05, 0.0001246333122253418, 0.0001563727855682373, 0.0001881122589111328, 0.00021985173225402832, 0.00025159120559692383, 0.00028333067893981934, 0.00031507015228271484, 0.00034680962562561035, 0.00037854909896850586, 0.00041028857231140137, 0.0004420280456542969, 0.0004737675189971924, 0.0005055069923400879, 0.0005372464656829834, 0.0005689859390258789, 0.0006007254123687744, 0.0006324648857116699, 0.0006642043590545654, 0.0006959438323974609, 0.0007276833057403564, 0.000759422779083252, 0.0007911622524261475, 0.000822901725769043, 0.0008546411991119385, 0.000886380672454834, 0.0009181201457977295, 0.000949859619140625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 0.0, 7.0, 6.0, 12.0, 17.0, 23.0, 32.0, 37.0, 46.0, 63.0, 107.0, 148.0, 167.0, 252.0, 389.0, 543.0, 762.0, 1109.0, 1720.0, 2790.0, 4623.0, 8501.0, 17600.0, 44743.0, 184912.0, 643663.0, 80911.0, 27089.0, 11881.0, 6191.0, 3530.0, 2225.0, 1331.0, 969.0, 631.0, 417.0, 334.0, 223.0, 149.0, 100.0, 85.0, 59.0, 50.0, 36.0, 23.0, 16.0, 15.0, 6.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.171875, -29.206298828125, -28.24072265625, -27.275146484375, -26.3095703125, -25.343994140625, -24.37841796875, -23.412841796875, -22.447265625, -21.481689453125, -20.51611328125, -19.550537109375, -18.5849609375, -17.619384765625, -16.65380859375, -15.688232421875, -14.72265625, -13.757080078125, -12.79150390625, -11.825927734375, -10.8603515625, -9.894775390625, -8.92919921875, -7.963623046875, -6.998046875, -6.032470703125, -5.06689453125, -4.101318359375, -3.1357421875, -2.170166015625, -1.20458984375, -0.239013671875, 0.7265625, 1.692138671875, 2.65771484375, 3.623291015625, 4.5888671875, 5.554443359375, 6.52001953125, 7.485595703125, 8.451171875, 9.416748046875, 10.38232421875, 11.347900390625, 12.3134765625, 13.279052734375, 14.24462890625, 15.210205078125, 16.17578125, 17.141357421875, 18.10693359375, 19.072509765625, 20.0380859375, 21.003662109375, 21.96923828125, 22.934814453125, 23.900390625, 24.865966796875, 25.83154296875, 26.797119140625, 27.7626953125, 28.728271484375, 29.69384765625, 30.659423828125, 31.625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 4.0, 7.0, 6.0, 8.0, 11.0, 23.0, 27.0, 29.0, 48.0, 63.0, 62.0, 65.0, 225.0, 75.0, 79.0, 61.0, 43.0, 25.0, 28.0, 24.0, 9.0, 14.0, 11.0, 6.0, 5.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.25, -8.01312255859375, -7.7762451171875, -7.53936767578125, -7.302490234375, -7.06561279296875, -6.8287353515625, -6.59185791015625, -6.35498046875, -6.11810302734375, -5.8812255859375, -5.64434814453125, -5.407470703125, -5.17059326171875, -4.9337158203125, -4.69683837890625, -4.4599609375, -4.22308349609375, -3.9862060546875, -3.74932861328125, -3.512451171875, -3.27557373046875, -3.0386962890625, -2.80181884765625, -2.56494140625, -2.32806396484375, -2.0911865234375, -1.85430908203125, -1.617431640625, -1.38055419921875, -1.1436767578125, -0.90679931640625, -0.669921875, -0.43304443359375, -0.1961669921875, 0.04071044921875, 0.277587890625, 0.51446533203125, 0.7513427734375, 0.98822021484375, 1.22509765625, 1.46197509765625, 1.6988525390625, 1.93572998046875, 2.172607421875, 2.40948486328125, 2.6463623046875, 2.88323974609375, 3.1201171875, 3.35699462890625, 3.5938720703125, 3.83074951171875, 4.067626953125, 4.30450439453125, 4.5413818359375, 4.77825927734375, 5.01513671875, 5.25201416015625, 5.4888916015625, 5.72576904296875, 5.962646484375, 6.19952392578125, 6.4364013671875, 6.67327880859375, 6.91015625]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 16.0, 17.0, 20.0, 26.0, 46.0, 71.0, 91.0, 168.0, 142.0, 100.0, 66.0, 69.0, 34.0, 32.0, 19.0, 13.0, 7.0, 12.0, 5.0, 9.0, 2.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.714938163757324, -13.143060684204102, -12.571183204650879, -11.999305725097656, -11.42742919921875, -10.855551719665527, -10.283674240112305, -9.711797714233398, -9.13991928100586, -8.568041801452637, -7.996164798736572, -7.42428731918335, -6.852410316467285, -6.2805328369140625, -5.70865535736084, -5.136778354644775, -4.564901351928711, -3.9930241107940674, -3.421146869659424, -2.849269390106201, -2.2773921489715576, -1.705514907836914, -1.1336374282836914, -0.561760425567627, 0.010117053985595703, 0.581994354724884, 1.1538716554641724, 1.7257490158081055, 2.297626256942749, 2.8695034980773926, 3.4413809776306152, 4.01325798034668, 4.585136413574219, 5.157013893127441, 5.728890895843506, 6.3007683753967285, 6.872645378112793, 7.444522857666016, 8.016400337219238, 8.588277816772461, 9.160154342651367, 9.73203182220459, 10.303909301757812, 10.875785827636719, 11.447663307189941, 12.019540786743164, 12.591418266296387, 13.16329574584961, 13.735173225402832, 14.307050704956055, 14.878928184509277, 15.4508056640625, 16.022682189941406, 16.594558715820312, 17.16643714904785, 17.738313674926758, 18.310192108154297, 18.882068634033203, 19.453947067260742, 20.02582359313965, 20.597702026367188, 21.169578552246094, 21.741455078125, 22.31333351135254, 22.885210037231445]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 2.0, 3.0, 9.0, 6.0, 14.0, 7.0, 6.0, 18.0, 15.0, 17.0, 15.0, 25.0, 17.0, 30.0, 31.0, 48.0, 39.0, 37.0, 44.0, 27.0, 37.0, 37.0, 36.0, 37.0, 48.0, 40.0, 28.0, 42.0, 41.0, 29.0, 31.0, 32.0, 22.0, 18.0, 21.0, 12.0, 9.0, 12.0, 11.0, 9.0, 10.0, 6.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.390366554260254, -10.07083797454834, -9.751310348510742, -9.431781768798828, -9.112253189086914, -8.792724609375, -8.473196983337402, -8.153668403625488, -7.834140300750732, -7.514612197875977, -7.1950836181640625, -6.875555515289307, -6.556027412414551, -6.236498832702637, -5.916970729827881, -5.597442626953125, -5.277914047241211, -4.958385944366455, -4.638857364654541, -4.319329261779785, -3.99980092048645, -3.6802725791931152, -3.3607444763183594, -3.0412161350250244, -2.7216877937316895, -2.4021594524383545, -2.0826311111450195, -1.7631030082702637, -1.4435746669769287, -1.1240463256835938, -0.8045181035995483, -0.48498988151550293, -0.16546154022216797, 0.15406674146652222, 0.4735950231552124, 0.7931233048439026, 1.1126515865325928, 1.4321799278259277, 1.7517081499099731, 2.0712363719940186, 2.3907647132873535, 2.7102930545806885, 3.0298213958740234, 3.3493494987487793, 3.6688778400421143, 3.988406181335449, 4.307934284210205, 4.627462387084961, 4.946990966796875, 5.266519069671631, 5.586047649383545, 5.905575752258301, 6.225104331970215, 6.544632434844971, 6.864160537719727, 7.183689117431641, 7.5032172203063965, 7.822745323181152, 8.142273902893066, 8.46180248260498, 8.781330108642578, 9.100858688354492, 9.420387268066406, 9.739914894104004, 10.059443473815918]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 7.0, 1.0, 19.0, 16.0, 31.0, 31.0, 66.0, 84.0, 146.0, 183.0, 276.0, 369.0, 596.0, 814.0, 1139.0, 1832.0, 2577.0, 3875.0, 6005.0, 9348.0, 14953.0, 24981.0, 44358.0, 85618.0, 198866.0, 724780.0, 2046444.0, 652088.0, 186705.0, 82544.0, 42229.0, 23681.0, 14095.0, 8790.0, 5469.0, 3665.0, 2446.0, 1668.0, 1119.0, 761.0, 495.0, 408.0, 229.0, 151.0, 107.0, 77.0, 59.0, 25.0, 28.0, 15.0, 9.0, 7.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.3671875, -13.91064453125, -13.4541015625, -12.99755859375, -12.541015625, -12.08447265625, -11.6279296875, -11.17138671875, -10.71484375, -10.25830078125, -9.8017578125, -9.34521484375, -8.888671875, -8.43212890625, -7.9755859375, -7.51904296875, -7.0625, -6.60595703125, -6.1494140625, -5.69287109375, -5.236328125, -4.77978515625, -4.3232421875, -3.86669921875, -3.41015625, -2.95361328125, -2.4970703125, -2.04052734375, -1.583984375, -1.12744140625, -0.6708984375, -0.21435546875, 0.2421875, 0.69873046875, 1.1552734375, 1.61181640625, 2.068359375, 2.52490234375, 2.9814453125, 3.43798828125, 3.89453125, 4.35107421875, 4.8076171875, 5.26416015625, 5.720703125, 6.17724609375, 6.6337890625, 7.09033203125, 7.546875, 8.00341796875, 8.4599609375, 8.91650390625, 9.373046875, 9.82958984375, 10.2861328125, 10.74267578125, 11.19921875, 11.65576171875, 12.1123046875, 12.56884765625, 13.025390625, 13.48193359375, 13.9384765625, 14.39501953125, 14.8515625]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 5.0, 7.0, 10.0, 9.0, 11.0, 11.0, 16.0, 16.0, 21.0, 20.0, 35.0, 32.0, 46.0, 30.0, 30.0, 48.0, 46.0, 39.0, 38.0, 34.0, 42.0, 40.0, 39.0, 46.0, 40.0, 34.0, 38.0, 26.0, 31.0, 27.0, 22.0, 18.0, 9.0, 10.0, 11.0, 9.0, 10.0, 6.0, 6.0, 4.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.08984375, -5.90185546875, -5.7138671875, -5.52587890625, -5.337890625, -5.14990234375, -4.9619140625, -4.77392578125, -4.5859375, -4.39794921875, -4.2099609375, -4.02197265625, -3.833984375, -3.64599609375, -3.4580078125, -3.27001953125, -3.08203125, -2.89404296875, -2.7060546875, -2.51806640625, -2.330078125, -2.14208984375, -1.9541015625, -1.76611328125, -1.578125, -1.39013671875, -1.2021484375, -1.01416015625, -0.826171875, -0.63818359375, -0.4501953125, -0.26220703125, -0.07421875, 0.11376953125, 0.3017578125, 0.48974609375, 0.677734375, 0.86572265625, 1.0537109375, 1.24169921875, 1.4296875, 1.61767578125, 1.8056640625, 1.99365234375, 2.181640625, 2.36962890625, 2.5576171875, 2.74560546875, 2.93359375, 3.12158203125, 3.3095703125, 3.49755859375, 3.685546875, 3.87353515625, 4.0615234375, 4.24951171875, 4.4375, 4.62548828125, 4.8134765625, 5.00146484375, 5.189453125, 5.37744140625, 5.5654296875, 5.75341796875, 5.94140625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 9.0, 18.0, 18.0, 20.0, 37.0, 40.0, 56.0, 102.0, 146.0, 179.0, 238.0, 400.0, 524.0, 790.0, 1149.0, 1630.0, 2520.0, 3958.0, 6300.0, 10114.0, 17457.0, 31711.0, 63002.0, 143491.0, 397933.0, 1559692.0, 1339335.0, 351744.0, 129975.0, 58587.0, 29512.0, 16529.0, 9830.0, 5933.0, 3773.0, 2363.0, 1586.0, 1117.0, 777.0, 489.0, 356.0, 244.0, 179.0, 121.0, 97.0, 49.0, 51.0, 34.0, 20.0, 17.0, 8.0, 11.0, 6.0, 5.0, 3.0, 1.0, 3.0], "bins": [-13.3203125, -12.916015625, -12.51171875, -12.107421875, -11.703125, -11.298828125, -10.89453125, -10.490234375, -10.0859375, -9.681640625, -9.27734375, -8.873046875, -8.46875, -8.064453125, -7.66015625, -7.255859375, -6.8515625, -6.447265625, -6.04296875, -5.638671875, -5.234375, -4.830078125, -4.42578125, -4.021484375, -3.6171875, -3.212890625, -2.80859375, -2.404296875, -2.0, -1.595703125, -1.19140625, -0.787109375, -0.3828125, 0.021484375, 0.42578125, 0.830078125, 1.234375, 1.638671875, 2.04296875, 2.447265625, 2.8515625, 3.255859375, 3.66015625, 4.064453125, 4.46875, 4.873046875, 5.27734375, 5.681640625, 6.0859375, 6.490234375, 6.89453125, 7.298828125, 7.703125, 8.107421875, 8.51171875, 8.916015625, 9.3203125, 9.724609375, 10.12890625, 10.533203125, 10.9375, 11.341796875, 11.74609375, 12.150390625, 12.5546875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 13.0, 7.0, 12.0, 13.0, 21.0, 34.0, 25.0, 39.0, 58.0, 68.0, 93.0, 133.0, 153.0, 211.0, 250.0, 303.0, 344.0, 430.0, 345.0, 306.0, 256.0, 205.0, 152.0, 126.0, 83.0, 72.0, 56.0, 44.0, 41.0, 36.0, 30.0, 20.0, 16.0, 12.0, 5.0, 12.0, 12.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.6328125, -3.5185546875, -3.404296875, -3.2900390625, -3.17578125, -3.0615234375, -2.947265625, -2.8330078125, -2.71875, -2.6044921875, -2.490234375, -2.3759765625, -2.26171875, -2.1474609375, -2.033203125, -1.9189453125, -1.8046875, -1.6904296875, -1.576171875, -1.4619140625, -1.34765625, -1.2333984375, -1.119140625, -1.0048828125, -0.890625, -0.7763671875, -0.662109375, -0.5478515625, -0.43359375, -0.3193359375, -0.205078125, -0.0908203125, 0.0234375, 0.1376953125, 0.251953125, 0.3662109375, 0.48046875, 0.5947265625, 0.708984375, 0.8232421875, 0.9375, 1.0517578125, 1.166015625, 1.2802734375, 1.39453125, 1.5087890625, 1.623046875, 1.7373046875, 1.8515625, 1.9658203125, 2.080078125, 2.1943359375, 2.30859375, 2.4228515625, 2.537109375, 2.6513671875, 2.765625, 2.8798828125, 2.994140625, 3.1083984375, 3.22265625, 3.3369140625, 3.451171875, 3.5654296875, 3.6796875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 3.0, 6.0, 5.0, 7.0, 17.0, 14.0, 15.0, 17.0, 39.0, 48.0, 71.0, 83.0, 123.0, 135.0, 92.0, 85.0, 54.0, 43.0, 35.0, 25.0, 10.0, 10.0, 11.0, 5.0, 7.0, 9.0, 3.0, 4.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.473067283630371, -8.128633499145508, -7.7841997146606445, -7.439765930175781, -7.095332145690918, -6.750898361206055, -6.406464576721191, -6.062030792236328, -5.717597007751465, -5.373163223266602, -5.028729438781738, -4.684295654296875, -4.339861869812012, -3.9954280853271484, -3.650994300842285, -3.306560516357422, -2.9621267318725586, -2.6176929473876953, -2.273259162902832, -1.9288253784179688, -1.5843915939331055, -1.2399578094482422, -0.8955240249633789, -0.5510902404785156, -0.20665645599365234, 0.13777732849121094, 0.4822111129760742, 0.8266448974609375, 1.1710786819458008, 1.515512466430664, 1.8599462509155273, 2.2043800354003906, 2.5488147735595703, 2.8932485580444336, 3.237682342529297, 3.58211612701416, 3.9265499114990234, 4.270983695983887, 4.61541748046875, 4.959851264953613, 5.304285049438477, 5.64871883392334, 5.993152618408203, 6.337586402893066, 6.68202018737793, 7.026453971862793, 7.370887756347656, 7.7153215408325195, 8.059755325317383, 8.404189109802246, 8.74862289428711, 9.093056678771973, 9.437490463256836, 9.7819242477417, 10.126358032226562, 10.470791816711426, 10.815225601196289, 11.159659385681152, 11.504093170166016, 11.848526954650879, 12.192960739135742, 12.537394523620605, 12.881828308105469, 13.226262092590332, 13.570695877075195]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 5.0, 8.0, 12.0, 12.0, 16.0, 27.0, 19.0, 21.0, 25.0, 24.0, 19.0, 39.0, 36.0, 31.0, 40.0, 31.0, 31.0, 37.0, 35.0, 37.0, 41.0, 37.0, 30.0, 36.0, 40.0, 31.0, 32.0, 42.0, 38.0, 22.0, 16.0, 20.0, 16.0, 13.0, 15.0, 13.0, 10.0, 11.0, 4.0, 8.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.174876689910889, -6.962295055389404, -6.749712944030762, -6.537131309509277, -6.324549198150635, -6.11196756362915, -5.899385452270508, -5.686803817749023, -5.474222183227539, -5.261640548706055, -5.049058437347412, -4.836476802825928, -4.623894691467285, -4.411313056945801, -4.198731422424316, -3.986149311065674, -3.7735671997070312, -3.5609853267669678, -3.3484034538269043, -3.13582181930542, -2.9232397079467773, -2.710658073425293, -2.4980762004852295, -2.285494327545166, -2.0729124546051025, -1.860330581665039, -1.6477487087249756, -1.4351669549942017, -1.2225850820541382, -1.0100032091140747, -0.7974214553833008, -0.5848395824432373, -0.3722572326660156, -0.15967538952827454, 0.05290645360946655, 0.26548826694488525, 0.47807013988494873, 0.6906520128250122, 0.9032337665557861, 1.1158156394958496, 1.328397512435913, 1.5409793853759766, 1.75356125831604, 1.966143012046814, 2.178724765777588, 2.3913068771362305, 2.603888511657715, 2.8164703845977783, 3.029052257537842, 3.2416341304779053, 3.4542160034179688, 3.666797637939453, 3.8793797492980957, 4.09196138381958, 4.304543495178223, 4.517125129699707, 4.729706764221191, 4.942288398742676, 5.154870510101318, 5.367452144622803, 5.580034255981445, 5.79261589050293, 6.005197525024414, 6.217779636383057, 6.430361747741699]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 5.0, 10.0, 8.0, 12.0, 24.0, 34.0, 45.0, 67.0, 104.0, 161.0, 231.0, 359.0, 536.0, 929.0, 1479.0, 2486.0, 4289.0, 7794.0, 15265.0, 32070.0, 77685.0, 219625.0, 401129.0, 167249.0, 61565.0, 26330.0, 12655.0, 6915.0, 3647.0, 2282.0, 1307.0, 813.0, 506.0, 305.0, 234.0, 122.0, 105.0, 55.0, 36.0, 29.0, 14.0, 16.0, 7.0, 7.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0], "bins": [-7.16015625, -6.96331787109375, -6.7664794921875, -6.56964111328125, -6.372802734375, -6.17596435546875, -5.9791259765625, -5.78228759765625, -5.58544921875, -5.38861083984375, -5.1917724609375, -4.99493408203125, -4.798095703125, -4.60125732421875, -4.4044189453125, -4.20758056640625, -4.0107421875, -3.81390380859375, -3.6170654296875, -3.42022705078125, -3.223388671875, -3.02655029296875, -2.8297119140625, -2.63287353515625, -2.43603515625, -2.23919677734375, -2.0423583984375, -1.84552001953125, -1.648681640625, -1.45184326171875, -1.2550048828125, -1.05816650390625, -0.861328125, -0.66448974609375, -0.4676513671875, -0.27081298828125, -0.073974609375, 0.12286376953125, 0.3197021484375, 0.51654052734375, 0.71337890625, 0.91021728515625, 1.1070556640625, 1.30389404296875, 1.500732421875, 1.69757080078125, 1.8944091796875, 2.09124755859375, 2.2880859375, 2.48492431640625, 2.6817626953125, 2.87860107421875, 3.075439453125, 3.27227783203125, 3.4691162109375, 3.66595458984375, 3.86279296875, 4.05963134765625, 4.2564697265625, 4.45330810546875, 4.650146484375, 4.84698486328125, 5.0438232421875, 5.24066162109375, 5.4375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 5.0, 5.0, 6.0, 10.0, 15.0, 10.0, 20.0, 17.0, 21.0, 17.0, 33.0, 26.0, 28.0, 45.0, 33.0, 34.0, 30.0, 36.0, 42.0, 35.0, 40.0, 38.0, 35.0, 34.0, 42.0, 43.0, 39.0, 34.0, 28.0, 26.0, 33.0, 19.0, 25.0, 18.0, 18.0, 10.0, 11.0, 6.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.11328125, -6.896484375, -6.6796875, -6.462890625, -6.24609375, -6.029296875, -5.8125, -5.595703125, -5.37890625, -5.162109375, -4.9453125, -4.728515625, -4.51171875, -4.294921875, -4.078125, -3.861328125, -3.64453125, -3.427734375, -3.2109375, -2.994140625, -2.77734375, -2.560546875, -2.34375, -2.126953125, -1.91015625, -1.693359375, -1.4765625, -1.259765625, -1.04296875, -0.826171875, -0.609375, -0.392578125, -0.17578125, 0.041015625, 0.2578125, 0.474609375, 0.69140625, 0.908203125, 1.125, 1.341796875, 1.55859375, 1.775390625, 1.9921875, 2.208984375, 2.42578125, 2.642578125, 2.859375, 3.076171875, 3.29296875, 3.509765625, 3.7265625, 3.943359375, 4.16015625, 4.376953125, 4.59375, 4.810546875, 5.02734375, 5.244140625, 5.4609375, 5.677734375, 5.89453125, 6.111328125, 6.328125, 6.544921875, 6.76171875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 12.0, 13.0, 15.0, 29.0, 23.0, 31.0, 46.0, 68.0, 113.0, 148.0, 207.0, 238.0, 382.0, 527.0, 750.0, 1082.0, 1658.0, 2654.0, 4317.0, 7243.0, 14665.0, 35108.0, 112911.0, 521523.0, 238548.0, 58982.0, 21684.0, 10285.0, 5522.0, 3233.0, 2025.0, 1368.0, 925.0, 690.0, 445.0, 303.0, 242.0, 149.0, 121.0, 81.0, 54.0, 50.0, 21.0, 15.0, 17.0, 7.0, 9.0, 10.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.02734375, -6.79107666015625, -6.5548095703125, -6.31854248046875, -6.082275390625, -5.84600830078125, -5.6097412109375, -5.37347412109375, -5.13720703125, -4.90093994140625, -4.6646728515625, -4.42840576171875, -4.192138671875, -3.95587158203125, -3.7196044921875, -3.48333740234375, -3.2470703125, -3.01080322265625, -2.7745361328125, -2.53826904296875, -2.302001953125, -2.06573486328125, -1.8294677734375, -1.59320068359375, -1.35693359375, -1.12066650390625, -0.8843994140625, -0.64813232421875, -0.411865234375, -0.17559814453125, 0.0606689453125, 0.29693603515625, 0.533203125, 0.76947021484375, 1.0057373046875, 1.24200439453125, 1.478271484375, 1.71453857421875, 1.9508056640625, 2.18707275390625, 2.42333984375, 2.65960693359375, 2.8958740234375, 3.13214111328125, 3.368408203125, 3.60467529296875, 3.8409423828125, 4.07720947265625, 4.3134765625, 4.54974365234375, 4.7860107421875, 5.02227783203125, 5.258544921875, 5.49481201171875, 5.7310791015625, 5.96734619140625, 6.20361328125, 6.43988037109375, 6.6761474609375, 6.91241455078125, 7.148681640625, 7.38494873046875, 7.6212158203125, 7.85748291015625, 8.09375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 10.0, 8.0, 15.0, 12.0, 20.0, 14.0, 21.0, 17.0, 19.0, 25.0, 33.0, 27.0, 30.0, 35.0, 29.0, 49.0, 52.0, 45.0, 30.0, 40.0, 37.0, 41.0, 53.0, 24.0, 40.0, 42.0, 39.0, 31.0, 23.0, 19.0, 15.0, 17.0, 16.0, 22.0, 10.0, 11.0, 10.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.9241943359375, -4.774169921875, -4.6241455078125, -4.47412109375, -4.3240966796875, -4.174072265625, -4.0240478515625, -3.8740234375, -3.7239990234375, -3.573974609375, -3.4239501953125, -3.27392578125, -3.1239013671875, -2.973876953125, -2.8238525390625, -2.673828125, -2.5238037109375, -2.373779296875, -2.2237548828125, -2.07373046875, -1.9237060546875, -1.773681640625, -1.6236572265625, -1.4736328125, -1.3236083984375, -1.173583984375, -1.0235595703125, -0.87353515625, -0.7235107421875, -0.573486328125, -0.4234619140625, -0.2734375, -0.1234130859375, 0.026611328125, 0.1766357421875, 0.32666015625, 0.4766845703125, 0.626708984375, 0.7767333984375, 0.9267578125, 1.0767822265625, 1.226806640625, 1.3768310546875, 1.52685546875, 1.6768798828125, 1.826904296875, 1.9769287109375, 2.126953125, 2.2769775390625, 2.427001953125, 2.5770263671875, 2.72705078125, 2.8770751953125, 3.027099609375, 3.1771240234375, 3.3271484375, 3.4771728515625, 3.627197265625, 3.7772216796875, 3.92724609375, 4.0772705078125, 4.227294921875, 4.3773193359375, 4.52734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 14.0, 13.0, 15.0, 22.0, 22.0, 25.0, 37.0, 39.0, 88.0, 80.0, 125.0, 187.0, 279.0, 494.0, 823.0, 1664.0, 3538.0, 9231.0, 32803.0, 667941.0, 290431.0, 26104.0, 7642.0, 3242.0, 1546.0, 793.0, 468.0, 255.0, 168.0, 122.0, 84.0, 63.0, 43.0, 25.0, 31.0, 17.0, 19.0, 10.0, 9.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-2.873046875, -2.788360595703125, -2.70367431640625, -2.618988037109375, -2.5343017578125, -2.449615478515625, -2.36492919921875, -2.280242919921875, -2.195556640625, -2.110870361328125, -2.02618408203125, -1.941497802734375, -1.8568115234375, -1.772125244140625, -1.68743896484375, -1.602752685546875, -1.51806640625, -1.433380126953125, -1.34869384765625, -1.264007568359375, -1.1793212890625, -1.094635009765625, -1.00994873046875, -0.925262451171875, -0.840576171875, -0.755889892578125, -0.67120361328125, -0.586517333984375, -0.5018310546875, -0.417144775390625, -0.33245849609375, -0.247772216796875, -0.1630859375, -0.078399658203125, 0.00628662109375, 0.090972900390625, 0.1756591796875, 0.260345458984375, 0.34503173828125, 0.429718017578125, 0.514404296875, 0.599090576171875, 0.68377685546875, 0.768463134765625, 0.8531494140625, 0.937835693359375, 1.02252197265625, 1.107208251953125, 1.19189453125, 1.276580810546875, 1.36126708984375, 1.445953369140625, 1.5306396484375, 1.615325927734375, 1.70001220703125, 1.784698486328125, 1.869384765625, 1.954071044921875, 2.03875732421875, 2.123443603515625, 2.2081298828125, 2.292816162109375, 2.37750244140625, 2.462188720703125, 2.546875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 19.0, 28.0, 75.0, 154.0, 359.0, 209.0, 90.0, 27.0, 17.0, 15.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002262592315673828, -0.00021989457309246063, -0.00021352991461753845, -0.00020716525614261627, -0.0002008005976676941, -0.0001944359391927719, -0.00018807128071784973, -0.00018170662224292755, -0.00017534196376800537, -0.0001689773052930832, -0.000162612646818161, -0.00015624798834323883, -0.00014988332986831665, -0.00014351867139339447, -0.0001371540129184723, -0.0001307893544435501, -0.00012442469596862793, -0.00011806003749370575, -0.00011169537901878357, -0.00010533072054386139, -9.896606206893921e-05, -9.260140359401703e-05, -8.623674511909485e-05, -7.987208664417267e-05, -7.350742816925049e-05, -6.714276969432831e-05, -6.077811121940613e-05, -5.441345274448395e-05, -4.804879426956177e-05, -4.168413579463959e-05, -3.531947731971741e-05, -2.8954818844795227e-05, -2.2590160369873047e-05, -1.6225501894950867e-05, -9.860843420028687e-06, -3.4961849451065063e-06, 2.868473529815674e-06, 9.233132004737854e-06, 1.5597790479660034e-05, 2.1962448954582214e-05, 2.8327107429504395e-05, 3.4691765904426575e-05, 4.1056424379348755e-05, 4.7421082854270935e-05, 5.3785741329193115e-05, 6.0150399804115295e-05, 6.651505827903748e-05, 7.287971675395966e-05, 7.924437522888184e-05, 8.560903370380402e-05, 9.19736921787262e-05, 9.833835065364838e-05, 0.00010470300912857056, 0.00011106766760349274, 0.00011743232607841492, 0.0001237969845533371, 0.00013016164302825928, 0.00013652630150318146, 0.00014289095997810364, 0.00014925561845302582, 0.000155620276927948, 0.00016198493540287018, 0.00016834959387779236, 0.00017471425235271454, 0.00018107891082763672]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 7.0, 11.0, 13.0, 25.0, 37.0, 42.0, 55.0, 98.0, 136.0, 192.0, 292.0, 457.0, 723.0, 1063.0, 1765.0, 2908.0, 4887.0, 9096.0, 17381.0, 37285.0, 98452.0, 495833.0, 249337.0, 68405.0, 28412.0, 13713.0, 7248.0, 4039.0, 2402.0, 1476.0, 953.0, 589.0, 383.0, 252.0, 181.0, 111.0, 81.0, 57.0, 38.0, 33.0, 17.0, 14.0, 17.0, 7.0, 4.0, 6.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.150390625, -2.08282470703125, -2.0152587890625, -1.94769287109375, -1.880126953125, -1.81256103515625, -1.7449951171875, -1.67742919921875, -1.60986328125, -1.54229736328125, -1.4747314453125, -1.40716552734375, -1.339599609375, -1.27203369140625, -1.2044677734375, -1.13690185546875, -1.0693359375, -1.00177001953125, -0.9342041015625, -0.86663818359375, -0.799072265625, -0.73150634765625, -0.6639404296875, -0.59637451171875, -0.52880859375, -0.46124267578125, -0.3936767578125, -0.32611083984375, -0.258544921875, -0.19097900390625, -0.1234130859375, -0.05584716796875, 0.01171875, 0.07928466796875, 0.1468505859375, 0.21441650390625, 0.281982421875, 0.34954833984375, 0.4171142578125, 0.48468017578125, 0.55224609375, 0.61981201171875, 0.6873779296875, 0.75494384765625, 0.822509765625, 0.89007568359375, 0.9576416015625, 1.02520751953125, 1.0927734375, 1.16033935546875, 1.2279052734375, 1.29547119140625, 1.363037109375, 1.43060302734375, 1.4981689453125, 1.56573486328125, 1.63330078125, 1.70086669921875, 1.7684326171875, 1.83599853515625, 1.903564453125, 1.97113037109375, 2.0386962890625, 2.10626220703125, 2.173828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 4.0, 6.0, 4.0, 7.0, 10.0, 12.0, 16.0, 20.0, 20.0, 27.0, 36.0, 67.0, 63.0, 78.0, 98.0, 83.0, 98.0, 65.0, 60.0, 62.0, 46.0, 26.0, 15.0, 19.0, 19.0, 11.0, 10.0, 4.0, 8.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6810073852539062, -0.6593780517578125, -0.6377487182617188, -0.616119384765625, -0.5944900512695312, -0.5728607177734375, -0.5512313842773438, -0.52960205078125, -0.5079727172851562, -0.4863433837890625, -0.46471405029296875, -0.443084716796875, -0.42145538330078125, -0.3998260498046875, -0.37819671630859375, -0.3565673828125, -0.33493804931640625, -0.3133087158203125, -0.29167938232421875, -0.270050048828125, -0.24842071533203125, -0.2267913818359375, -0.20516204833984375, -0.18353271484375, -0.16190338134765625, -0.1402740478515625, -0.11864471435546875, -0.097015380859375, -0.07538604736328125, -0.0537567138671875, -0.03212738037109375, -0.010498046875, 0.01113128662109375, 0.0327606201171875, 0.05438995361328125, 0.076019287109375, 0.09764862060546875, 0.1192779541015625, 0.14090728759765625, 0.16253662109375, 0.18416595458984375, 0.2057952880859375, 0.22742462158203125, 0.249053955078125, 0.27068328857421875, 0.2923126220703125, 0.31394195556640625, 0.3355712890625, 0.35720062255859375, 0.3788299560546875, 0.40045928955078125, 0.422088623046875, 0.44371795654296875, 0.4653472900390625, 0.48697662353515625, 0.50860595703125, 0.5302352905273438, 0.5518646240234375, 0.5734939575195312, 0.595123291015625, 0.6167526245117188, 0.6383819580078125, 0.6600112915039062, 0.681640625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 3.0, 7.0, 5.0, 3.0, 5.0, 9.0, 9.0, 17.0, 21.0, 14.0, 34.0, 41.0, 67.0, 100.0, 107.0, 128.0, 94.0, 84.0, 61.0, 52.0, 21.0, 30.0, 13.0, 9.0, 12.0, 14.0, 3.0, 5.0, 8.0, 4.0, 2.0, 5.0, 5.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.758175849914551, -7.428292274475098, -7.0984086990356445, -6.768525123596191, -6.438641548156738, -6.108757972717285, -5.77887487411499, -5.448991298675537, -5.119107723236084, -4.789224147796631, -4.459340572357178, -4.129456996917725, -3.7995736598968506, -3.4696900844573975, -3.1398067474365234, -2.8099231719970703, -2.480039596557617, -2.150156021118164, -1.8202725648880005, -1.490389108657837, -1.1605055332183838, -0.8306219577789307, -0.5007385015487671, -0.17085504531860352, 0.1590285301208496, 0.48891204595565796, 0.8187955617904663, 1.1486790180206299, 1.478562593460083, 1.8084461688995361, 2.13832950592041, 2.4682130813598633, 2.7980966567993164, 3.1279802322387695, 3.4578638076782227, 3.7877471446990967, 4.117630958557129, 4.447514533996582, 4.777397632598877, 5.10728120803833, 5.437164783477783, 5.767048358917236, 6.0969319343566895, 6.426815509796143, 6.7566986083984375, 7.086582183837891, 7.416465759277344, 7.746349334716797, 8.07623291015625, 8.406116485595703, 8.736000061035156, 9.06588363647461, 9.395767211914062, 9.725650787353516, 10.055534362792969, 10.385417938232422, 10.715301513671875, 11.045185089111328, 11.375068664550781, 11.704952239990234, 12.034835815429688, 12.36471939086914, 12.694602966308594, 13.024486541748047, 13.354369163513184]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 8.0, 5.0, 11.0, 10.0, 16.0, 14.0, 17.0, 29.0, 18.0, 29.0, 22.0, 24.0, 40.0, 40.0, 30.0, 34.0, 28.0, 36.0, 34.0, 40.0, 38.0, 38.0, 32.0, 32.0, 35.0, 40.0, 36.0, 32.0, 37.0, 38.0, 15.0, 20.0, 19.0, 10.0, 18.0, 18.0, 10.0, 11.0, 11.0, 5.0, 6.0, 3.0, 1.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-7.043219566345215, -6.831769943237305, -6.6203203201293945, -6.408870697021484, -6.197421073913574, -5.985971450805664, -5.774521827697754, -5.563072204589844, -5.351622581481934, -5.140172958374023, -4.928723335266113, -4.717273712158203, -4.505824089050293, -4.294374465942383, -4.082924842834473, -3.8714752197265625, -3.6600255966186523, -3.448575973510742, -3.237126350402832, -3.025676727294922, -2.8142271041870117, -2.6027774810791016, -2.3913278579711914, -2.1798782348632812, -1.968428611755371, -1.756978988647461, -1.5455293655395508, -1.3340797424316406, -1.1226301193237305, -0.9111804962158203, -0.6997308731079102, -0.48828125, -0.27683210372924805, -0.06538248062133789, 0.14606714248657227, 0.3575167655944824, 0.5689663887023926, 0.7804160118103027, 0.9918656349182129, 1.203315258026123, 1.4147648811340332, 1.6262145042419434, 1.8376641273498535, 2.0491137504577637, 2.260563373565674, 2.472012996673584, 2.683462619781494, 2.8949122428894043, 3.1063618659973145, 3.3178114891052246, 3.5292611122131348, 3.740710735321045, 3.952160358428955, 4.163609981536865, 4.375059604644775, 4.5865092277526855, 4.797958850860596, 5.009408473968506, 5.220858097076416, 5.432307720184326, 5.643757343292236, 5.8552069664001465, 6.066656589508057, 6.278106212615967, 6.489555835723877]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 8.0, 7.0, 22.0, 37.0, 48.0, 67.0, 107.0, 181.0, 271.0, 399.0, 681.0, 1074.0, 1758.0, 2907.0, 4768.0, 7711.0, 13306.0, 22338.0, 38656.0, 65930.0, 112657.0, 188499.0, 224191.0, 149827.0, 87663.0, 51147.0, 30132.0, 17662.0, 10603.0, 6154.0, 3785.0, 2156.0, 1332.0, 893.0, 588.0, 317.0, 235.0, 160.0, 117.0, 55.0, 38.0, 25.0, 14.0, 8.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.3984375, -9.107177734375, -8.81591796875, -8.524658203125, -8.2333984375, -7.942138671875, -7.65087890625, -7.359619140625, -7.068359375, -6.777099609375, -6.48583984375, -6.194580078125, -5.9033203125, -5.612060546875, -5.32080078125, -5.029541015625, -4.73828125, -4.447021484375, -4.15576171875, -3.864501953125, -3.5732421875, -3.281982421875, -2.99072265625, -2.699462890625, -2.408203125, -2.116943359375, -1.82568359375, -1.534423828125, -1.2431640625, -0.951904296875, -0.66064453125, -0.369384765625, -0.078125, 0.213134765625, 0.50439453125, 0.795654296875, 1.0869140625, 1.378173828125, 1.66943359375, 1.960693359375, 2.251953125, 2.543212890625, 2.83447265625, 3.125732421875, 3.4169921875, 3.708251953125, 3.99951171875, 4.290771484375, 4.58203125, 4.873291015625, 5.16455078125, 5.455810546875, 5.7470703125, 6.038330078125, 6.32958984375, 6.620849609375, 6.912109375, 7.203369140625, 7.49462890625, 7.785888671875, 8.0771484375, 8.368408203125, 8.65966796875, 8.950927734375, 9.2421875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 9.0, 4.0, 17.0, 15.0, 19.0, 22.0, 17.0, 20.0, 28.0, 27.0, 48.0, 34.0, 33.0, 29.0, 36.0, 43.0, 38.0, 41.0, 38.0, 43.0, 35.0, 36.0, 31.0, 41.0, 42.0, 26.0, 31.0, 20.0, 32.0, 28.0, 19.0, 12.0, 16.0, 13.0, 9.0, 10.0, 6.0, 9.0, 3.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.44140625, -6.24298095703125, -6.0445556640625, -5.84613037109375, -5.647705078125, -5.44927978515625, -5.2508544921875, -5.05242919921875, -4.85400390625, -4.65557861328125, -4.4571533203125, -4.25872802734375, -4.060302734375, -3.86187744140625, -3.6634521484375, -3.46502685546875, -3.2666015625, -3.06817626953125, -2.8697509765625, -2.67132568359375, -2.472900390625, -2.27447509765625, -2.0760498046875, -1.87762451171875, -1.67919921875, -1.48077392578125, -1.2823486328125, -1.08392333984375, -0.885498046875, -0.68707275390625, -0.4886474609375, -0.29022216796875, -0.091796875, 0.10662841796875, 0.3050537109375, 0.50347900390625, 0.701904296875, 0.90032958984375, 1.0987548828125, 1.29718017578125, 1.49560546875, 1.69403076171875, 1.8924560546875, 2.09088134765625, 2.289306640625, 2.48773193359375, 2.6861572265625, 2.88458251953125, 3.0830078125, 3.28143310546875, 3.4798583984375, 3.67828369140625, 3.876708984375, 4.07513427734375, 4.2735595703125, 4.47198486328125, 4.67041015625, 4.86883544921875, 5.0672607421875, 5.26568603515625, 5.464111328125, 5.66253662109375, 5.8609619140625, 6.05938720703125, 6.2578125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 6.0, 9.0, 11.0, 23.0, 32.0, 54.0, 80.0, 103.0, 148.0, 227.0, 385.0, 550.0, 893.0, 1464.0, 2457.0, 4105.0, 7022.0, 11990.0, 21420.0, 38210.0, 69925.0, 134391.0, 249936.0, 234789.0, 123000.0, 64951.0, 34919.0, 19804.0, 11235.0, 6476.0, 3877.0, 2260.0, 1382.0, 833.0, 524.0, 359.0, 244.0, 156.0, 99.0, 49.0, 57.0, 29.0, 21.0, 13.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-10.3203125, -9.9866943359375, -9.653076171875, -9.3194580078125, -8.98583984375, -8.6522216796875, -8.318603515625, -7.9849853515625, -7.6513671875, -7.3177490234375, -6.984130859375, -6.6505126953125, -6.31689453125, -5.9832763671875, -5.649658203125, -5.3160400390625, -4.982421875, -4.6488037109375, -4.315185546875, -3.9815673828125, -3.64794921875, -3.3143310546875, -2.980712890625, -2.6470947265625, -2.3134765625, -1.9798583984375, -1.646240234375, -1.3126220703125, -0.97900390625, -0.6453857421875, -0.311767578125, 0.0218505859375, 0.35546875, 0.6890869140625, 1.022705078125, 1.3563232421875, 1.68994140625, 2.0235595703125, 2.357177734375, 2.6907958984375, 3.0244140625, 3.3580322265625, 3.691650390625, 4.0252685546875, 4.35888671875, 4.6925048828125, 5.026123046875, 5.3597412109375, 5.693359375, 6.0269775390625, 6.360595703125, 6.6942138671875, 7.02783203125, 7.3614501953125, 7.695068359375, 8.0286865234375, 8.3623046875, 8.6959228515625, 9.029541015625, 9.3631591796875, 9.69677734375, 10.0303955078125, 10.364013671875, 10.6976318359375, 11.03125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 7.0, 9.0, 6.0, 10.0, 12.0, 21.0, 34.0, 28.0, 35.0, 30.0, 42.0, 32.0, 39.0, 43.0, 39.0, 49.0, 45.0, 33.0, 56.0, 35.0, 54.0, 46.0, 45.0, 38.0, 35.0, 24.0, 31.0, 26.0, 21.0, 12.0, 17.0, 10.0, 9.0, 7.0, 7.0, 6.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16796875, -5.0030517578125, -4.838134765625, -4.6732177734375, -4.50830078125, -4.3433837890625, -4.178466796875, -4.0135498046875, -3.8486328125, -3.6837158203125, -3.518798828125, -3.3538818359375, -3.18896484375, -3.0240478515625, -2.859130859375, -2.6942138671875, -2.529296875, -2.3643798828125, -2.199462890625, -2.0345458984375, -1.86962890625, -1.7047119140625, -1.539794921875, -1.3748779296875, -1.2099609375, -1.0450439453125, -0.880126953125, -0.7152099609375, -0.55029296875, -0.3853759765625, -0.220458984375, -0.0555419921875, 0.109375, 0.2742919921875, 0.439208984375, 0.6041259765625, 0.76904296875, 0.9339599609375, 1.098876953125, 1.2637939453125, 1.4287109375, 1.5936279296875, 1.758544921875, 1.9234619140625, 2.08837890625, 2.2532958984375, 2.418212890625, 2.5831298828125, 2.748046875, 2.9129638671875, 3.077880859375, 3.2427978515625, 3.40771484375, 3.5726318359375, 3.737548828125, 3.9024658203125, 4.0673828125, 4.2322998046875, 4.397216796875, 4.5621337890625, 4.72705078125, 4.8919677734375, 5.056884765625, 5.2218017578125, 5.38671875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 7.0, 9.0, 23.0, 24.0, 32.0, 38.0, 66.0, 99.0, 142.0, 185.0, 329.0, 431.0, 669.0, 1085.0, 1776.0, 3010.0, 5187.0, 9581.0, 19783.0, 46778.0, 142610.0, 588016.0, 140490.0, 46004.0, 19689.0, 9459.0, 5174.0, 2899.0, 1742.0, 1075.0, 690.0, 472.0, 305.0, 201.0, 147.0, 93.0, 72.0, 48.0, 36.0, 21.0, 19.0, 9.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.53125, -17.9609375, -17.390625, -16.8203125, -16.25, -15.6796875, -15.109375, -14.5390625, -13.96875, -13.3984375, -12.828125, -12.2578125, -11.6875, -11.1171875, -10.546875, -9.9765625, -9.40625, -8.8359375, -8.265625, -7.6953125, -7.125, -6.5546875, -5.984375, -5.4140625, -4.84375, -4.2734375, -3.703125, -3.1328125, -2.5625, -1.9921875, -1.421875, -0.8515625, -0.28125, 0.2890625, 0.859375, 1.4296875, 2.0, 2.5703125, 3.140625, 3.7109375, 4.28125, 4.8515625, 5.421875, 5.9921875, 6.5625, 7.1328125, 7.703125, 8.2734375, 8.84375, 9.4140625, 9.984375, 10.5546875, 11.125, 11.6953125, 12.265625, 12.8359375, 13.40625, 13.9765625, 14.546875, 15.1171875, 15.6875, 16.2578125, 16.828125, 17.3984375, 17.96875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 6.0, 7.0, 12.0, 9.0, 13.0, 12.0, 22.0, 30.0, 44.0, 55.0, 80.0, 107.0, 200.0, 102.0, 77.0, 50.0, 44.0, 28.0, 31.0, 22.0, 11.0, 6.0, 11.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006074905395507812, -0.000588148832321167, -0.0005688071250915527, -0.0005494654178619385, -0.0005301237106323242, -0.00051078200340271, -0.0004914402961730957, -0.00047209858894348145, -0.0004527568817138672, -0.00043341517448425293, -0.00041407346725463867, -0.0003947317600250244, -0.00037539005279541016, -0.0003560483455657959, -0.00033670663833618164, -0.0003173649311065674, -0.0002980232238769531, -0.00027868151664733887, -0.0002593398094177246, -0.00023999810218811035, -0.0002206563949584961, -0.00020131468772888184, -0.00018197298049926758, -0.00016263127326965332, -0.00014328956604003906, -0.0001239478588104248, -0.00010460615158081055, -8.526444435119629e-05, -6.592273712158203e-05, -4.6581029891967773e-05, -2.7239322662353516e-05, -7.897615432739258e-06, 1.1444091796875e-05, 3.078579902648926e-05, 5.0127506256103516e-05, 6.946921348571777e-05, 8.881092071533203e-05, 0.00010815262794494629, 0.00012749433517456055, 0.0001468360424041748, 0.00016617774963378906, 0.00018551945686340332, 0.00020486116409301758, 0.00022420287132263184, 0.0002435445785522461, 0.00026288628578186035, 0.0002822279930114746, 0.00030156970024108887, 0.0003209114074707031, 0.0003402531147003174, 0.00035959482192993164, 0.0003789365291595459, 0.00039827823638916016, 0.0004176199436187744, 0.00043696165084838867, 0.00045630335807800293, 0.0004756450653076172, 0.0004949867725372314, 0.0005143284797668457, 0.00053367018699646, 0.0005530118942260742, 0.0005723536014556885, 0.0005916953086853027, 0.000611037015914917, 0.0006303787231445312]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 11.0, 13.0, 18.0, 22.0, 48.0, 61.0, 99.0, 125.0, 176.0, 249.0, 401.0, 588.0, 812.0, 1266.0, 2076.0, 3295.0, 5535.0, 10265.0, 20247.0, 46818.0, 141934.0, 587021.0, 136957.0, 45696.0, 20097.0, 10047.0, 5627.0, 3190.0, 2018.0, 1247.0, 859.0, 564.0, 340.0, 240.0, 163.0, 127.0, 88.0, 64.0, 33.0, 28.0, 17.0, 25.0, 16.0, 7.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.71875, -17.17333984375, -16.6279296875, -16.08251953125, -15.537109375, -14.99169921875, -14.4462890625, -13.90087890625, -13.35546875, -12.81005859375, -12.2646484375, -11.71923828125, -11.173828125, -10.62841796875, -10.0830078125, -9.53759765625, -8.9921875, -8.44677734375, -7.9013671875, -7.35595703125, -6.810546875, -6.26513671875, -5.7197265625, -5.17431640625, -4.62890625, -4.08349609375, -3.5380859375, -2.99267578125, -2.447265625, -1.90185546875, -1.3564453125, -0.81103515625, -0.265625, 0.27978515625, 0.8251953125, 1.37060546875, 1.916015625, 2.46142578125, 3.0068359375, 3.55224609375, 4.09765625, 4.64306640625, 5.1884765625, 5.73388671875, 6.279296875, 6.82470703125, 7.3701171875, 7.91552734375, 8.4609375, 9.00634765625, 9.5517578125, 10.09716796875, 10.642578125, 11.18798828125, 11.7333984375, 12.27880859375, 12.82421875, 13.36962890625, 13.9150390625, 14.46044921875, 15.005859375, 15.55126953125, 16.0966796875, 16.64208984375, 17.1875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 8.0, 13.0, 12.0, 15.0, 24.0, 30.0, 36.0, 49.0, 54.0, 47.0, 71.0, 145.0, 63.0, 54.0, 77.0, 49.0, 50.0, 32.0, 30.0, 25.0, 21.0, 16.0, 8.0, 8.0, 5.0, 4.0, 10.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.03997802734375, -3.9041748046875, -3.76837158203125, -3.632568359375, -3.49676513671875, -3.3609619140625, -3.22515869140625, -3.08935546875, -2.95355224609375, -2.8177490234375, -2.68194580078125, -2.546142578125, -2.41033935546875, -2.2745361328125, -2.13873291015625, -2.0029296875, -1.86712646484375, -1.7313232421875, -1.59552001953125, -1.459716796875, -1.32391357421875, -1.1881103515625, -1.05230712890625, -0.91650390625, -0.78070068359375, -0.6448974609375, -0.50909423828125, -0.373291015625, -0.23748779296875, -0.1016845703125, 0.03411865234375, 0.169921875, 0.30572509765625, 0.4415283203125, 0.57733154296875, 0.713134765625, 0.84893798828125, 0.9847412109375, 1.12054443359375, 1.25634765625, 1.39215087890625, 1.5279541015625, 1.66375732421875, 1.799560546875, 1.93536376953125, 2.0711669921875, 2.20697021484375, 2.3427734375, 2.47857666015625, 2.6143798828125, 2.75018310546875, 2.885986328125, 3.02178955078125, 3.1575927734375, 3.29339599609375, 3.42919921875, 3.56500244140625, 3.7008056640625, 3.83660888671875, 3.972412109375, 4.10821533203125, 4.2440185546875, 4.37982177734375, 4.515625]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 7.0, 10.0, 10.0, 6.0, 10.0, 20.0, 24.0, 29.0, 56.0, 66.0, 103.0, 100.0, 93.0, 107.0, 76.0, 51.0, 44.0, 27.0, 33.0, 17.0, 20.0, 11.0, 18.0, 4.0, 10.0, 5.0, 6.0, 3.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.029196739196777, -7.739762783050537, -7.450328350067139, -7.160894393920898, -6.8714599609375, -6.58202600479126, -6.2925920486450195, -6.003157615661621, -5.713723659515381, -5.424289703369141, -5.134855270385742, -4.845421314239502, -4.555987358093262, -4.266552925109863, -3.977118968963623, -3.6876847743988037, -3.3982505798339844, -3.108816385269165, -2.8193821907043457, -2.5299482345581055, -2.240514039993286, -1.9510798454284668, -1.661645770072937, -1.3722116947174072, -1.082777500152588, -0.7933433651924133, -0.5039092302322388, -0.2144750952720642, 0.07495903968811035, 0.3643932342529297, 0.6538273096084595, 0.9432613849639893, 1.2326955795288086, 1.522129774093628, 1.8115638494491577, 2.1009979248046875, 2.390432119369507, 2.679866313934326, 2.9693002700805664, 3.2587344646453857, 3.548168659210205, 3.8376028537750244, 4.127037048339844, 4.416471004486084, 4.705904960632324, 4.995339393615723, 5.284773349761963, 5.574207305908203, 5.863641738891602, 6.153075695037842, 6.44251012802124, 6.7319440841674805, 7.021378517150879, 7.310812473297119, 7.600246429443359, 7.889680862426758, 8.179115295410156, 8.468549728393555, 8.757983207702637, 9.047417640686035, 9.336852073669434, 9.626285552978516, 9.915719985961914, 10.205154418945312, 10.494587898254395]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 9.0, 13.0, 17.0, 15.0, 18.0, 18.0, 28.0, 29.0, 25.0, 44.0, 33.0, 39.0, 50.0, 37.0, 51.0, 35.0, 48.0, 49.0, 44.0, 42.0, 43.0, 40.0, 40.0, 45.0, 25.0, 22.0, 18.0, 18.0, 17.0, 22.0, 6.0, 14.0, 11.0, 3.0, 5.0, 9.0, 3.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.674130439758301, -7.423503875732422, -7.172877311706543, -6.922250747680664, -6.671624183654785, -6.420997619628906, -6.1703715324401855, -5.919744968414307, -5.669118404388428, -5.418491840362549, -5.16786527633667, -4.917238712310791, -4.66661262512207, -4.415986061096191, -4.1653594970703125, -3.9147329330444336, -3.6641063690185547, -3.413479804992676, -3.162853240966797, -2.912226915359497, -2.661600351333618, -2.4109737873077393, -2.1603474617004395, -1.9097208976745605, -1.6590943336486816, -1.4084677696228027, -1.1578413248062134, -0.9072148203849792, -0.6565883159637451, -0.4059617519378662, -0.15533530712127686, 0.0952911376953125, 0.3459177017211914, 0.5965442061424255, 0.8471707105636597, 1.097797155380249, 1.348423719406128, 1.5990502834320068, 1.8496767282485962, 2.1003031730651855, 2.3509297370910645, 2.6015563011169434, 2.8521828651428223, 3.102809190750122, 3.353435754776001, 3.60406231880188, 3.8546886444091797, 4.105315208435059, 4.3559417724609375, 4.606568336486816, 4.857194900512695, 5.107821464538574, 5.358448028564453, 5.609074592590332, 5.859700679779053, 6.110327243804932, 6.3609538078308105, 6.6115803718566895, 6.862206935882568, 7.112833499908447, 7.363459587097168, 7.614086151123047, 7.864712715148926, 8.115339279174805, 8.365965843200684]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 10.0, 9.0, 16.0, 19.0, 27.0, 43.0, 76.0, 105.0, 166.0, 298.0, 516.0, 791.0, 1325.0, 2146.0, 3576.0, 6001.0, 10445.0, 18604.0, 34257.0, 68186.0, 160172.0, 594252.0, 2259364.0, 705167.0, 175082.0, 72433.0, 34712.0, 18314.0, 10468.0, 6352.0, 3877.0, 2519.0, 1584.0, 1112.0, 716.0, 498.0, 338.0, 242.0, 162.0, 92.0, 73.0, 45.0, 31.0, 28.0, 8.0, 11.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.2734375, -11.9075927734375, -11.541748046875, -11.1759033203125, -10.81005859375, -10.4442138671875, -10.078369140625, -9.7125244140625, -9.3466796875, -8.9808349609375, -8.614990234375, -8.2491455078125, -7.88330078125, -7.5174560546875, -7.151611328125, -6.7857666015625, -6.419921875, -6.0540771484375, -5.688232421875, -5.3223876953125, -4.95654296875, -4.5906982421875, -4.224853515625, -3.8590087890625, -3.4931640625, -3.1273193359375, -2.761474609375, -2.3956298828125, -2.02978515625, -1.6639404296875, -1.298095703125, -0.9322509765625, -0.56640625, -0.2005615234375, 0.165283203125, 0.5311279296875, 0.89697265625, 1.2628173828125, 1.628662109375, 1.9945068359375, 2.3603515625, 2.7261962890625, 3.092041015625, 3.4578857421875, 3.82373046875, 4.1895751953125, 4.555419921875, 4.9212646484375, 5.287109375, 5.6529541015625, 6.018798828125, 6.3846435546875, 6.75048828125, 7.1163330078125, 7.482177734375, 7.8480224609375, 8.2138671875, 8.5797119140625, 8.945556640625, 9.3114013671875, 9.67724609375, 10.0430908203125, 10.408935546875, 10.7747802734375, 11.140625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 1.0, 2.0, 6.0, 10.0, 11.0, 20.0, 20.0, 14.0, 16.0, 24.0, 28.0, 33.0, 35.0, 33.0, 45.0, 36.0, 42.0, 55.0, 39.0, 39.0, 44.0, 45.0, 36.0, 56.0, 40.0, 34.0, 35.0, 27.0, 28.0, 27.0, 27.0, 10.0, 22.0, 11.0, 9.0, 8.0, 8.0, 7.0, 5.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.30859375, -4.16949462890625, -4.0303955078125, -3.89129638671875, -3.752197265625, -3.61309814453125, -3.4739990234375, -3.33489990234375, -3.19580078125, -3.05670166015625, -2.9176025390625, -2.77850341796875, -2.639404296875, -2.50030517578125, -2.3612060546875, -2.22210693359375, -2.0830078125, -1.94390869140625, -1.8048095703125, -1.66571044921875, -1.526611328125, -1.38751220703125, -1.2484130859375, -1.10931396484375, -0.97021484375, -0.83111572265625, -0.6920166015625, -0.55291748046875, -0.413818359375, -0.27471923828125, -0.1356201171875, 0.00347900390625, 0.142578125, 0.28167724609375, 0.4207763671875, 0.55987548828125, 0.698974609375, 0.83807373046875, 0.9771728515625, 1.11627197265625, 1.25537109375, 1.39447021484375, 1.5335693359375, 1.67266845703125, 1.811767578125, 1.95086669921875, 2.0899658203125, 2.22906494140625, 2.3681640625, 2.50726318359375, 2.6463623046875, 2.78546142578125, 2.924560546875, 3.06365966796875, 3.2027587890625, 3.34185791015625, 3.48095703125, 3.62005615234375, 3.7591552734375, 3.89825439453125, 4.037353515625, 4.17645263671875, 4.3155517578125, 4.45465087890625, 4.59375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 12.0, 15.0, 18.0, 20.0, 30.0, 57.0, 77.0, 99.0, 144.0, 220.0, 309.0, 505.0, 699.0, 1124.0, 1644.0, 2497.0, 3868.0, 6140.0, 9658.0, 15878.0, 27257.0, 49457.0, 100843.0, 234928.0, 708709.0, 1888641.0, 692518.0, 230736.0, 99499.0, 49172.0, 26880.0, 15584.0, 9630.0, 6107.0, 3817.0, 2576.0, 1611.0, 1088.0, 700.0, 453.0, 328.0, 207.0, 172.0, 109.0, 78.0, 51.0, 40.0, 19.0, 13.0, 15.0, 9.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-8.140625, -7.89007568359375, -7.6395263671875, -7.38897705078125, -7.138427734375, -6.88787841796875, -6.6373291015625, -6.38677978515625, -6.13623046875, -5.88568115234375, -5.6351318359375, -5.38458251953125, -5.134033203125, -4.88348388671875, -4.6329345703125, -4.38238525390625, -4.1318359375, -3.88128662109375, -3.6307373046875, -3.38018798828125, -3.129638671875, -2.87908935546875, -2.6285400390625, -2.37799072265625, -2.12744140625, -1.87689208984375, -1.6263427734375, -1.37579345703125, -1.125244140625, -0.87469482421875, -0.6241455078125, -0.37359619140625, -0.123046875, 0.12750244140625, 0.3780517578125, 0.62860107421875, 0.879150390625, 1.12969970703125, 1.3802490234375, 1.63079833984375, 1.88134765625, 2.13189697265625, 2.3824462890625, 2.63299560546875, 2.883544921875, 3.13409423828125, 3.3846435546875, 3.63519287109375, 3.8857421875, 4.13629150390625, 4.3868408203125, 4.63739013671875, 4.887939453125, 5.13848876953125, 5.3890380859375, 5.63958740234375, 5.89013671875, 6.14068603515625, 6.3912353515625, 6.64178466796875, 6.892333984375, 7.14288330078125, 7.3934326171875, 7.64398193359375, 7.89453125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 8.0, 10.0, 8.0, 5.0, 12.0, 20.0, 17.0, 26.0, 23.0, 33.0, 36.0, 58.0, 60.0, 85.0, 107.0, 106.0, 160.0, 204.0, 185.0, 261.0, 318.0, 329.0, 348.0, 296.0, 236.0, 202.0, 165.0, 132.0, 105.0, 115.0, 79.0, 60.0, 40.0, 56.0, 25.0, 23.0, 23.0, 25.0, 20.0, 14.0, 7.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.1796875, -2.112060546875, -2.04443359375, -1.976806640625, -1.9091796875, -1.841552734375, -1.77392578125, -1.706298828125, -1.638671875, -1.571044921875, -1.50341796875, -1.435791015625, -1.3681640625, -1.300537109375, -1.23291015625, -1.165283203125, -1.09765625, -1.030029296875, -0.96240234375, -0.894775390625, -0.8271484375, -0.759521484375, -0.69189453125, -0.624267578125, -0.556640625, -0.489013671875, -0.42138671875, -0.353759765625, -0.2861328125, -0.218505859375, -0.15087890625, -0.083251953125, -0.015625, 0.052001953125, 0.11962890625, 0.187255859375, 0.2548828125, 0.322509765625, 0.39013671875, 0.457763671875, 0.525390625, 0.593017578125, 0.66064453125, 0.728271484375, 0.7958984375, 0.863525390625, 0.93115234375, 0.998779296875, 1.06640625, 1.134033203125, 1.20166015625, 1.269287109375, 1.3369140625, 1.404541015625, 1.47216796875, 1.539794921875, 1.607421875, 1.675048828125, 1.74267578125, 1.810302734375, 1.8779296875, 1.945556640625, 2.01318359375, 2.080810546875, 2.1484375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 10.0, 13.0, 19.0, 15.0, 30.0, 46.0, 60.0, 116.0, 154.0, 129.0, 117.0, 72.0, 53.0, 52.0, 24.0, 17.0, 21.0, 10.0, 10.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.268768310546875, -7.9864420890808105, -7.704115867614746, -7.421789646148682, -7.139463424682617, -6.857137203216553, -6.574810981750488, -6.292484283447266, -6.010158538818359, -5.727832317352295, -5.4455060958862305, -5.163179874420166, -4.880853652954102, -4.598527431488037, -4.316201210021973, -4.03387451171875, -3.7515482902526855, -3.469222068786621, -3.1868958473205566, -2.904569625854492, -2.6222434043884277, -2.3399171829223633, -2.0575907230377197, -1.7752645015716553, -1.4929382801055908, -1.2106120586395264, -0.9282857775688171, -0.6459594964981079, -0.36363327503204346, -0.081307053565979, 0.201019287109375, 0.48334550857543945, 0.7656717300415039, 1.0479979515075684, 1.3303241729736328, 1.6126505136489868, 1.8949767351150513, 2.177302837371826, 2.4596292972564697, 2.741955518722534, 3.0242817401885986, 3.306607961654663, 3.5889341831207275, 3.871260643005371, 4.1535868644714355, 4.4359130859375, 4.7182393074035645, 5.000565528869629, 5.282891750335693, 5.565217971801758, 5.847544193267822, 6.129870414733887, 6.412196636199951, 6.694522857666016, 6.976849555969238, 7.2591753005981445, 7.541501998901367, 7.823828220367432, 8.106154441833496, 8.388481140136719, 8.670806884765625, 8.953133583068848, 9.235459327697754, 9.517786026000977, 9.800111770629883]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 4.0, 7.0, 11.0, 11.0, 14.0, 17.0, 26.0, 16.0, 33.0, 27.0, 39.0, 41.0, 28.0, 30.0, 38.0, 38.0, 29.0, 35.0, 55.0, 49.0, 55.0, 42.0, 36.0, 31.0, 38.0, 35.0, 38.0, 17.0, 28.0, 22.0, 12.0, 18.0, 15.0, 13.0, 6.0, 9.0, 6.0, 4.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.491585731506348, -4.334229469299316, -4.176872730255127, -4.019516468048096, -3.8621599674224854, -3.704803466796875, -3.5474472045898438, -3.3900907039642334, -3.232734203338623, -3.0753777027130127, -2.9180214405059814, -2.760664939880371, -2.6033084392547607, -2.4459519386291504, -2.288595676422119, -2.131239175796509, -1.9738829135894775, -1.8165265321731567, -1.6591700315475464, -1.5018136501312256, -1.3444571495056152, -1.1871007680892944, -1.0297443866729736, -0.8723878860473633, -0.7150315046310425, -0.5576750636100769, -0.4003186523914337, -0.24296224117279053, -0.08560580015182495, 0.07175064086914062, 0.22910702228546143, 0.3864635229110718, 0.5438199043273926, 0.7011763453483582, 0.8585327863693237, 1.0158891677856445, 1.1732456684112549, 1.3306020498275757, 1.4879584312438965, 1.6453149318695068, 1.8026713132858276, 1.9600276947021484, 2.117384195327759, 2.274740695953369, 2.4320969581604004, 2.5894534587860107, 2.746809959411621, 2.9041662216186523, 3.0615227222442627, 3.218879222869873, 3.3762354850769043, 3.5335919857025146, 3.690948486328125, 3.8483047485351562, 4.0056610107421875, 4.163017749786377, 4.320374011993408, 4.4777302742004395, 4.635087013244629, 4.79244327545166, 4.949799537658691, 5.107156276702881, 5.264512538909912, 5.421869277954102, 5.579225540161133]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 10.0, 13.0, 12.0, 19.0, 28.0, 35.0, 65.0, 112.0, 185.0, 246.0, 403.0, 656.0, 1104.0, 1898.0, 3343.0, 5894.0, 11347.0, 23709.0, 54697.0, 157048.0, 444104.0, 214798.0, 70375.0, 28637.0, 13464.0, 6994.0, 3884.0, 2121.0, 1280.0, 761.0, 469.0, 294.0, 200.0, 112.0, 80.0, 51.0, 31.0, 33.0, 12.0, 9.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.918701171875, -4.76318359375, -4.607666015625, -4.4521484375, -4.296630859375, -4.14111328125, -3.985595703125, -3.830078125, -3.674560546875, -3.51904296875, -3.363525390625, -3.2080078125, -3.052490234375, -2.89697265625, -2.741455078125, -2.5859375, -2.430419921875, -2.27490234375, -2.119384765625, -1.9638671875, -1.808349609375, -1.65283203125, -1.497314453125, -1.341796875, -1.186279296875, -1.03076171875, -0.875244140625, -0.7197265625, -0.564208984375, -0.40869140625, -0.253173828125, -0.09765625, 0.057861328125, 0.21337890625, 0.368896484375, 0.5244140625, 0.679931640625, 0.83544921875, 0.990966796875, 1.146484375, 1.302001953125, 1.45751953125, 1.613037109375, 1.7685546875, 1.924072265625, 2.07958984375, 2.235107421875, 2.390625, 2.546142578125, 2.70166015625, 2.857177734375, 3.0126953125, 3.168212890625, 3.32373046875, 3.479248046875, 3.634765625, 3.790283203125, 3.94580078125, 4.101318359375, 4.2568359375, 4.412353515625, 4.56787109375, 4.723388671875, 4.87890625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 10.0, 2.0, 17.0, 16.0, 21.0, 21.0, 31.0, 30.0, 28.0, 26.0, 38.0, 37.0, 33.0, 46.0, 35.0, 52.0, 56.0, 53.0, 40.0, 40.0, 46.0, 31.0, 46.0, 34.0, 30.0, 29.0, 28.0, 21.0, 13.0, 18.0, 10.0, 13.0, 9.0, 7.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.828125, -4.6605224609375, -4.492919921875, -4.3253173828125, -4.15771484375, -3.9901123046875, -3.822509765625, -3.6549072265625, -3.4873046875, -3.3197021484375, -3.152099609375, -2.9844970703125, -2.81689453125, -2.6492919921875, -2.481689453125, -2.3140869140625, -2.146484375, -1.9788818359375, -1.811279296875, -1.6436767578125, -1.47607421875, -1.3084716796875, -1.140869140625, -0.9732666015625, -0.8056640625, -0.6380615234375, -0.470458984375, -0.3028564453125, -0.13525390625, 0.0323486328125, 0.199951171875, 0.3675537109375, 0.53515625, 0.7027587890625, 0.870361328125, 1.0379638671875, 1.20556640625, 1.3731689453125, 1.540771484375, 1.7083740234375, 1.8759765625, 2.0435791015625, 2.211181640625, 2.3787841796875, 2.54638671875, 2.7139892578125, 2.881591796875, 3.0491943359375, 3.216796875, 3.3843994140625, 3.552001953125, 3.7196044921875, 3.88720703125, 4.0548095703125, 4.222412109375, 4.3900146484375, 4.5576171875, 4.7252197265625, 4.892822265625, 5.0604248046875, 5.22802734375, 5.3956298828125, 5.563232421875, 5.7308349609375, 5.8984375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 4.0, 6.0, 8.0, 11.0, 25.0, 21.0, 34.0, 62.0, 73.0, 125.0, 150.0, 267.0, 425.0, 612.0, 929.0, 1579.0, 2643.0, 4187.0, 8039.0, 18172.0, 54125.0, 313611.0, 524817.0, 74065.0, 22478.0, 9607.0, 4891.0, 2750.0, 1697.0, 1033.0, 739.0, 471.0, 294.0, 210.0, 116.0, 93.0, 64.0, 37.0, 30.0, 14.0, 6.0, 9.0, 11.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.47265625, -7.25360107421875, -7.0345458984375, -6.81549072265625, -6.596435546875, -6.37738037109375, -6.1583251953125, -5.93927001953125, -5.72021484375, -5.50115966796875, -5.2821044921875, -5.06304931640625, -4.843994140625, -4.62493896484375, -4.4058837890625, -4.18682861328125, -3.9677734375, -3.74871826171875, -3.5296630859375, -3.31060791015625, -3.091552734375, -2.87249755859375, -2.6534423828125, -2.43438720703125, -2.21533203125, -1.99627685546875, -1.7772216796875, -1.55816650390625, -1.339111328125, -1.12005615234375, -0.9010009765625, -0.68194580078125, -0.462890625, -0.24383544921875, -0.0247802734375, 0.19427490234375, 0.413330078125, 0.63238525390625, 0.8514404296875, 1.07049560546875, 1.28955078125, 1.50860595703125, 1.7276611328125, 1.94671630859375, 2.165771484375, 2.38482666015625, 2.6038818359375, 2.82293701171875, 3.0419921875, 3.26104736328125, 3.4801025390625, 3.69915771484375, 3.918212890625, 4.13726806640625, 4.3563232421875, 4.57537841796875, 4.79443359375, 5.01348876953125, 5.2325439453125, 5.45159912109375, 5.670654296875, 5.88970947265625, 6.1087646484375, 6.32781982421875, 6.546875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 7.0, 6.0, 6.0, 12.0, 11.0, 9.0, 11.0, 10.0, 20.0, 18.0, 21.0, 23.0, 30.0, 32.0, 31.0, 25.0, 34.0, 30.0, 46.0, 40.0, 35.0, 39.0, 34.0, 35.0, 40.0, 43.0, 41.0, 35.0, 38.0, 33.0, 25.0, 28.0, 20.0, 25.0, 12.0, 16.0, 10.0, 18.0, 14.0, 9.0, 3.0, 5.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.841796875, -2.7435302734375, -2.645263671875, -2.5469970703125, -2.44873046875, -2.3504638671875, -2.252197265625, -2.1539306640625, -2.0556640625, -1.9573974609375, -1.859130859375, -1.7608642578125, -1.66259765625, -1.5643310546875, -1.466064453125, -1.3677978515625, -1.26953125, -1.1712646484375, -1.072998046875, -0.9747314453125, -0.87646484375, -0.7781982421875, -0.679931640625, -0.5816650390625, -0.4833984375, -0.3851318359375, -0.286865234375, -0.1885986328125, -0.09033203125, 0.0079345703125, 0.106201171875, 0.2044677734375, 0.302734375, 0.4010009765625, 0.499267578125, 0.5975341796875, 0.69580078125, 0.7940673828125, 0.892333984375, 0.9906005859375, 1.0888671875, 1.1871337890625, 1.285400390625, 1.3836669921875, 1.48193359375, 1.5802001953125, 1.678466796875, 1.7767333984375, 1.875, 1.9732666015625, 2.071533203125, 2.1697998046875, 2.26806640625, 2.3663330078125, 2.464599609375, 2.5628662109375, 2.6611328125, 2.7593994140625, 2.857666015625, 2.9559326171875, 3.05419921875, 3.1524658203125, 3.250732421875, 3.3489990234375, 3.447265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 9.0, 8.0, 12.0, 8.0, 28.0, 32.0, 47.0, 59.0, 91.0, 108.0, 143.0, 221.0, 261.0, 370.0, 498.0, 743.0, 1096.0, 1540.0, 2392.0, 4013.0, 7204.0, 13940.0, 32790.0, 122334.0, 702208.0, 98768.0, 29085.0, 12795.0, 6700.0, 3703.0, 2177.0, 1569.0, 1074.0, 750.0, 501.0, 320.0, 277.0, 195.0, 133.0, 91.0, 75.0, 49.0, 32.0, 28.0, 14.0, 22.0, 13.0, 10.0, 10.0, 6.0, 3.0, 1.0, 2.0, 3.0, 4.0], "bins": [-0.6865234375, -0.6659927368164062, -0.6454620361328125, -0.6249313354492188, -0.604400634765625, -0.5838699340820312, -0.5633392333984375, -0.5428085327148438, -0.52227783203125, -0.5017471313476562, -0.4812164306640625, -0.46068572998046875, -0.440155029296875, -0.41962432861328125, -0.3990936279296875, -0.37856292724609375, -0.3580322265625, -0.33750152587890625, -0.3169708251953125, -0.29644012451171875, -0.275909423828125, -0.25537872314453125, -0.2348480224609375, -0.21431732177734375, -0.19378662109375, -0.17325592041015625, -0.1527252197265625, -0.13219451904296875, -0.111663818359375, -0.09113311767578125, -0.0706024169921875, -0.05007171630859375, -0.029541015625, -0.00901031494140625, 0.0115203857421875, 0.03205108642578125, 0.052581787109375, 0.07311248779296875, 0.0936431884765625, 0.11417388916015625, 0.13470458984375, 0.15523529052734375, 0.1757659912109375, 0.19629669189453125, 0.216827392578125, 0.23735809326171875, 0.2578887939453125, 0.27841949462890625, 0.2989501953125, 0.31948089599609375, 0.3400115966796875, 0.36054229736328125, 0.381072998046875, 0.40160369873046875, 0.4221343994140625, 0.44266510009765625, 0.46319580078125, 0.48372650146484375, 0.5042572021484375, 0.5247879028320312, 0.545318603515625, 0.5658493041992188, 0.5863800048828125, 0.6069107055664062, 0.62744140625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 1.0, 3.0, 5.0, 8.0, 6.0, 14.0, 15.0, 18.0, 30.0, 25.0, 56.0, 78.0, 86.0, 143.0, 131.0, 99.0, 67.0, 46.0, 36.0, 27.0, 10.0, 15.0, 14.0, 9.0, 17.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.74913215637207e-05, -3.6413781344890594e-05, -3.5336241126060486e-05, -3.425870090723038e-05, -3.318116068840027e-05, -3.210362046957016e-05, -3.102608025074005e-05, -2.9948540031909943e-05, -2.8870999813079834e-05, -2.7793459594249725e-05, -2.6715919375419617e-05, -2.5638379156589508e-05, -2.45608389377594e-05, -2.348329871892929e-05, -2.2405758500099182e-05, -2.1328218281269073e-05, -2.0250678062438965e-05, -1.9173137843608856e-05, -1.8095597624778748e-05, -1.701805740594864e-05, -1.594051718711853e-05, -1.4862976968288422e-05, -1.3785436749458313e-05, -1.2707896530628204e-05, -1.1630356311798096e-05, -1.0552816092967987e-05, -9.475275874137878e-06, -8.39773565530777e-06, -7.320195436477661e-06, -6.2426552176475525e-06, -5.165114998817444e-06, -4.087574779987335e-06, -3.0100345611572266e-06, -1.932494342327118e-06, -8.549541234970093e-07, 2.2258609533309937e-07, 1.300126314163208e-06, 2.3776665329933167e-06, 3.4552067518234253e-06, 4.532746970653534e-06, 5.610287189483643e-06, 6.687827408313751e-06, 7.76536762714386e-06, 8.842907845973969e-06, 9.920448064804077e-06, 1.0997988283634186e-05, 1.2075528502464294e-05, 1.3153068721294403e-05, 1.4230608940124512e-05, 1.530814915895462e-05, 1.638568937778473e-05, 1.7463229596614838e-05, 1.8540769815444946e-05, 1.9618310034275055e-05, 2.0695850253105164e-05, 2.1773390471935272e-05, 2.285093069076538e-05, 2.392847090959549e-05, 2.5006011128425598e-05, 2.6083551347255707e-05, 2.7161091566085815e-05, 2.8238631784915924e-05, 2.9316172003746033e-05, 3.039371222257614e-05, 3.147125244140625e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 9.0, 10.0, 16.0, 20.0, 30.0, 47.0, 66.0, 86.0, 129.0, 159.0, 281.0, 399.0, 591.0, 975.0, 1562.0, 2424.0, 4194.0, 7420.0, 14050.0, 29241.0, 77025.0, 512752.0, 282712.0, 60890.0, 24725.0, 12115.0, 6677.0, 3656.0, 2353.0, 1347.0, 862.0, 587.0, 374.0, 237.0, 156.0, 125.0, 80.0, 45.0, 39.0, 20.0, 15.0, 17.0, 9.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.099609375, -1.061553955078125, -1.02349853515625, -0.985443115234375, -0.9473876953125, -0.909332275390625, -0.87127685546875, -0.833221435546875, -0.795166015625, -0.757110595703125, -0.71905517578125, -0.680999755859375, -0.6429443359375, -0.604888916015625, -0.56683349609375, -0.528778076171875, -0.49072265625, -0.452667236328125, -0.41461181640625, -0.376556396484375, -0.3385009765625, -0.300445556640625, -0.26239013671875, -0.224334716796875, -0.186279296875, -0.148223876953125, -0.11016845703125, -0.072113037109375, -0.0340576171875, 0.003997802734375, 0.04205322265625, 0.080108642578125, 0.1181640625, 0.156219482421875, 0.19427490234375, 0.232330322265625, 0.2703857421875, 0.308441162109375, 0.34649658203125, 0.384552001953125, 0.422607421875, 0.460662841796875, 0.49871826171875, 0.536773681640625, 0.5748291015625, 0.612884521484375, 0.65093994140625, 0.688995361328125, 0.72705078125, 0.765106201171875, 0.80316162109375, 0.841217041015625, 0.8792724609375, 0.917327880859375, 0.95538330078125, 0.993438720703125, 1.031494140625, 1.069549560546875, 1.10760498046875, 1.145660400390625, 1.1837158203125, 1.221771240234375, 1.25982666015625, 1.297882080078125, 1.3359375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 3.0, 3.0, 5.0, 7.0, 10.0, 11.0, 16.0, 19.0, 27.0, 29.0, 42.0, 32.0, 39.0, 69.0, 86.0, 87.0, 81.0, 74.0, 68.0, 57.0, 45.0, 18.0, 21.0, 15.0, 25.0, 15.0, 13.0, 11.0, 12.0, 7.0, 10.0, 3.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.303466796875, -0.2950096130371094, -0.28655242919921875, -0.2780952453613281, -0.2696380615234375, -0.2611808776855469, -0.25272369384765625, -0.24426651000976562, -0.235809326171875, -0.22735214233398438, -0.21889495849609375, -0.21043777465820312, -0.2019805908203125, -0.19352340698242188, -0.18506622314453125, -0.17660903930664062, -0.16815185546875, -0.15969467163085938, -0.15123748779296875, -0.14278030395507812, -0.1343231201171875, -0.12586593627929688, -0.11740875244140625, -0.10895156860351562, -0.100494384765625, -0.09203720092773438, -0.08358001708984375, -0.07512283325195312, -0.0666656494140625, -0.058208465576171875, -0.04975128173828125, -0.041294097900390625, -0.0328369140625, -0.024379730224609375, -0.01592254638671875, -0.007465362548828125, 0.0009918212890625, 0.009449005126953125, 0.01790618896484375, 0.026363372802734375, 0.034820556640625, 0.043277740478515625, 0.05173492431640625, 0.060192108154296875, 0.0686492919921875, 0.07710647583007812, 0.08556365966796875, 0.09402084350585938, 0.10247802734375, 0.11093521118164062, 0.11939239501953125, 0.12784957885742188, 0.1363067626953125, 0.14476394653320312, 0.15322113037109375, 0.16167831420898438, 0.170135498046875, 0.17859268188476562, 0.18704986572265625, 0.19550704956054688, 0.2039642333984375, 0.21242141723632812, 0.22087860107421875, 0.22933578491210938, 0.23779296875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 12.0, 7.0, 12.0, 21.0, 26.0, 47.0, 55.0, 105.0, 148.0, 164.0, 96.0, 68.0, 57.0, 46.0, 31.0, 25.0, 10.0, 15.0, 11.0, 9.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.318948745727539, -7.049448013305664, -6.779947280883789, -6.510446071624756, -6.240945339202881, -5.971444606781006, -5.701943397521973, -5.432442665100098, -5.162941932678223, -4.893441200256348, -4.623940467834473, -4.3544392585754395, -4.0849385261535645, -3.8154377937316895, -3.5459368228912354, -3.2764358520507812, -3.0069351196289062, -2.7374343872070312, -2.467933416366577, -2.198432445526123, -1.928931713104248, -1.6594308614730835, -1.389930009841919, -1.1204291582107544, -0.8509283065795898, -0.5814274549484253, -0.31192660331726074, -0.04242575168609619, 0.22707509994506836, 0.4965759515762329, 0.7660768032073975, 1.035577654838562, 1.305079460144043, 1.5745803117752075, 1.844081163406372, 2.113582134246826, 2.383082866668701, 2.652583599090576, 2.9220845699310303, 3.1915855407714844, 3.4610862731933594, 3.7305870056152344, 4.000087738037109, 4.269588947296143, 4.539089679718018, 4.808590412139893, 5.078091621398926, 5.347592353820801, 5.617093086242676, 5.886593818664551, 6.156094551086426, 6.425595760345459, 6.695096492767334, 6.964597225189209, 7.234098434448242, 7.503599166870117, 7.773099899291992, 8.042600631713867, 8.312101364135742, 8.581602096557617, 8.851102828979492, 9.120604515075684, 9.390105247497559, 9.659605979919434, 9.929106712341309]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 4.0, 11.0, 6.0, 8.0, 15.0, 14.0, 19.0, 23.0, 18.0, 33.0, 38.0, 38.0, 33.0, 33.0, 29.0, 44.0, 27.0, 32.0, 40.0, 48.0, 61.0, 49.0, 40.0, 29.0, 37.0, 37.0, 36.0, 30.0, 23.0, 19.0, 22.0, 17.0, 15.0, 12.0, 15.0, 4.0, 7.0, 7.0, 3.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.382505416870117, -4.22703218460083, -4.071558952331543, -3.916086196899414, -3.760612964630127, -3.60513973236084, -3.449666738510132, -3.294193744659424, -3.1387205123901367, -2.9832472801208496, -2.8277742862701416, -2.6723012924194336, -2.5168280601501465, -2.3613548278808594, -2.2058818340301514, -2.0504088401794434, -1.8949356079101562, -1.7394624948501587, -1.5839893817901611, -1.4285162687301636, -1.273043155670166, -1.1175700426101685, -0.9620969295501709, -0.8066238164901733, -0.6511507034301758, -0.4956775903701782, -0.34020447731018066, -0.1847313642501831, -0.029258251190185547, 0.126214861869812, 0.28168797492980957, 0.43716108798980713, 0.5926342010498047, 0.7481073141098022, 0.9035804271697998, 1.0590535402297974, 1.214526653289795, 1.3699997663497925, 1.52547287940979, 1.6809459924697876, 1.8364191055297852, 1.9918922185897827, 2.1473653316497803, 2.3028383255004883, 2.4583115577697754, 2.6137847900390625, 2.7692577838897705, 2.9247307777404785, 3.0802040100097656, 3.2356772422790527, 3.3911502361297607, 3.5466232299804688, 3.702096462249756, 3.857569694519043, 4.013042449951172, 4.168515682220459, 4.323988914489746, 4.479462146759033, 4.63493537902832, 4.790408134460449, 4.945881366729736, 5.101354598999023, 5.256827354431152, 5.4123005867004395, 5.567773818969727]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 11.0, 18.0, 13.0, 19.0, 36.0, 69.0, 106.0, 118.0, 208.0, 305.0, 386.0, 596.0, 1030.0, 1526.0, 2526.0, 4350.0, 7990.0, 14932.0, 30510.0, 63162.0, 137847.0, 290425.0, 261409.0, 118663.0, 54853.0, 26638.0, 13245.0, 7088.0, 3982.0, 2346.0, 1409.0, 918.0, 564.0, 374.0, 237.0, 202.0, 136.0, 88.0, 59.0, 55.0, 33.0, 26.0, 10.0, 11.0, 7.0, 8.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.9364013671875, -7.661865234375, -7.3873291015625, -7.11279296875, -6.8382568359375, -6.563720703125, -6.2891845703125, -6.0146484375, -5.7401123046875, -5.465576171875, -5.1910400390625, -4.91650390625, -4.6419677734375, -4.367431640625, -4.0928955078125, -3.818359375, -3.5438232421875, -3.269287109375, -2.9947509765625, -2.72021484375, -2.4456787109375, -2.171142578125, -1.8966064453125, -1.6220703125, -1.3475341796875, -1.072998046875, -0.7984619140625, -0.52392578125, -0.2493896484375, 0.025146484375, 0.2996826171875, 0.57421875, 0.8487548828125, 1.123291015625, 1.3978271484375, 1.67236328125, 1.9468994140625, 2.221435546875, 2.4959716796875, 2.7705078125, 3.0450439453125, 3.319580078125, 3.5941162109375, 3.86865234375, 4.1431884765625, 4.417724609375, 4.6922607421875, 4.966796875, 5.2413330078125, 5.515869140625, 5.7904052734375, 6.06494140625, 6.3394775390625, 6.614013671875, 6.8885498046875, 7.1630859375, 7.4376220703125, 7.712158203125, 7.9866943359375, 8.26123046875, 8.5357666015625, 8.810302734375, 9.0848388671875, 9.359375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 0.0, 7.0, 5.0, 8.0, 7.0, 6.0, 16.0, 14.0, 21.0, 22.0, 29.0, 29.0, 34.0, 34.0, 29.0, 44.0, 44.0, 38.0, 32.0, 49.0, 46.0, 53.0, 59.0, 35.0, 42.0, 38.0, 40.0, 36.0, 29.0, 30.0, 23.0, 17.0, 14.0, 10.0, 12.0, 11.0, 7.0, 9.0, 6.0, 10.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.767578125, -3.625579833984375, -3.48358154296875, -3.341583251953125, -3.1995849609375, -3.057586669921875, -2.91558837890625, -2.773590087890625, -2.631591796875, -2.489593505859375, -2.34759521484375, -2.205596923828125, -2.0635986328125, -1.921600341796875, -1.77960205078125, -1.637603759765625, -1.49560546875, -1.353607177734375, -1.21160888671875, -1.069610595703125, -0.9276123046875, -0.785614013671875, -0.64361572265625, -0.501617431640625, -0.359619140625, -0.217620849609375, -0.07562255859375, 0.066375732421875, 0.2083740234375, 0.350372314453125, 0.49237060546875, 0.634368896484375, 0.7763671875, 0.918365478515625, 1.06036376953125, 1.202362060546875, 1.3443603515625, 1.486358642578125, 1.62835693359375, 1.770355224609375, 1.912353515625, 2.054351806640625, 2.19635009765625, 2.338348388671875, 2.4803466796875, 2.622344970703125, 2.76434326171875, 2.906341552734375, 3.04833984375, 3.190338134765625, 3.33233642578125, 3.474334716796875, 3.6163330078125, 3.758331298828125, 3.90032958984375, 4.042327880859375, 4.184326171875, 4.326324462890625, 4.46832275390625, 4.610321044921875, 4.7523193359375, 4.894317626953125, 5.03631591796875, 5.178314208984375, 5.3203125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 6.0, 4.0, 12.0, 15.0, 23.0, 31.0, 43.0, 71.0, 116.0, 173.0, 246.0, 419.0, 615.0, 977.0, 1651.0, 2793.0, 5039.0, 8990.0, 16756.0, 32913.0, 66176.0, 143608.0, 303825.0, 243461.0, 110591.0, 52518.0, 26383.0, 13709.0, 7338.0, 3987.0, 2325.0, 1474.0, 841.0, 466.0, 299.0, 196.0, 134.0, 107.0, 62.0, 62.0, 30.0, 24.0, 19.0, 11.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.6953125, -7.4373779296875, -7.179443359375, -6.9215087890625, -6.66357421875, -6.4056396484375, -6.147705078125, -5.8897705078125, -5.6318359375, -5.3739013671875, -5.115966796875, -4.8580322265625, -4.60009765625, -4.3421630859375, -4.084228515625, -3.8262939453125, -3.568359375, -3.3104248046875, -3.052490234375, -2.7945556640625, -2.53662109375, -2.2786865234375, -2.020751953125, -1.7628173828125, -1.5048828125, -1.2469482421875, -0.989013671875, -0.7310791015625, -0.47314453125, -0.2152099609375, 0.042724609375, 0.3006591796875, 0.55859375, 0.8165283203125, 1.074462890625, 1.3323974609375, 1.59033203125, 1.8482666015625, 2.106201171875, 2.3641357421875, 2.6220703125, 2.8800048828125, 3.137939453125, 3.3958740234375, 3.65380859375, 3.9117431640625, 4.169677734375, 4.4276123046875, 4.685546875, 4.9434814453125, 5.201416015625, 5.4593505859375, 5.71728515625, 5.9752197265625, 6.233154296875, 6.4910888671875, 6.7490234375, 7.0069580078125, 7.264892578125, 7.5228271484375, 7.78076171875, 8.0386962890625, 8.296630859375, 8.5545654296875, 8.8125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 7.0, 11.0, 7.0, 15.0, 11.0, 15.0, 16.0, 11.0, 24.0, 25.0, 34.0, 29.0, 30.0, 47.0, 28.0, 51.0, 40.0, 33.0, 34.0, 45.0, 50.0, 44.0, 30.0, 40.0, 37.0, 39.0, 33.0, 30.0, 38.0, 25.0, 26.0, 23.0, 12.0, 13.0, 8.0, 9.0, 13.0, 5.0, 4.0, 2.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.912109375, -2.818023681640625, -2.72393798828125, -2.629852294921875, -2.5357666015625, -2.441680908203125, -2.34759521484375, -2.253509521484375, -2.159423828125, -2.065338134765625, -1.97125244140625, -1.877166748046875, -1.7830810546875, -1.688995361328125, -1.59490966796875, -1.500823974609375, -1.40673828125, -1.312652587890625, -1.21856689453125, -1.124481201171875, -1.0303955078125, -0.936309814453125, -0.84222412109375, -0.748138427734375, -0.654052734375, -0.559967041015625, -0.46588134765625, -0.371795654296875, -0.2777099609375, -0.183624267578125, -0.08953857421875, 0.004547119140625, 0.0986328125, 0.192718505859375, 0.28680419921875, 0.380889892578125, 0.4749755859375, 0.569061279296875, 0.66314697265625, 0.757232666015625, 0.851318359375, 0.945404052734375, 1.03948974609375, 1.133575439453125, 1.2276611328125, 1.321746826171875, 1.41583251953125, 1.509918212890625, 1.60400390625, 1.698089599609375, 1.79217529296875, 1.886260986328125, 1.9803466796875, 2.074432373046875, 2.16851806640625, 2.262603759765625, 2.356689453125, 2.450775146484375, 2.54486083984375, 2.638946533203125, 2.7330322265625, 2.827117919921875, 2.92120361328125, 3.015289306640625, 3.109375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 9.0, 13.0, 19.0, 23.0, 22.0, 47.0, 48.0, 67.0, 119.0, 151.0, 213.0, 320.0, 439.0, 702.0, 1031.0, 1610.0, 2590.0, 4174.0, 7114.0, 13142.0, 26165.0, 61153.0, 234002.0, 557481.0, 72778.0, 29960.0, 14651.0, 7964.0, 4582.0, 2761.0, 1760.0, 1105.0, 734.0, 480.0, 341.0, 219.0, 162.0, 121.0, 80.0, 54.0, 49.0, 23.0, 14.0, 19.0, 14.0, 10.0, 3.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.6580810546875, -9.347412109375, -9.0367431640625, -8.72607421875, -8.4154052734375, -8.104736328125, -7.7940673828125, -7.4833984375, -7.1727294921875, -6.862060546875, -6.5513916015625, -6.24072265625, -5.9300537109375, -5.619384765625, -5.3087158203125, -4.998046875, -4.6873779296875, -4.376708984375, -4.0660400390625, -3.75537109375, -3.4447021484375, -3.134033203125, -2.8233642578125, -2.5126953125, -2.2020263671875, -1.891357421875, -1.5806884765625, -1.27001953125, -0.9593505859375, -0.648681640625, -0.3380126953125, -0.02734375, 0.2833251953125, 0.593994140625, 0.9046630859375, 1.21533203125, 1.5260009765625, 1.836669921875, 2.1473388671875, 2.4580078125, 2.7686767578125, 3.079345703125, 3.3900146484375, 3.70068359375, 4.0113525390625, 4.322021484375, 4.6326904296875, 4.943359375, 5.2540283203125, 5.564697265625, 5.8753662109375, 6.18603515625, 6.4967041015625, 6.807373046875, 7.1180419921875, 7.4287109375, 7.7393798828125, 8.050048828125, 8.3607177734375, 8.67138671875, 8.9820556640625, 9.292724609375, 9.6033935546875, 9.9140625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 8.0, 8.0, 10.0, 14.0, 23.0, 21.0, 30.0, 37.0, 54.0, 95.0, 204.0, 169.0, 90.0, 58.0, 41.0, 35.0, 16.0, 14.0, 13.0, 15.0, 8.0, 10.0, 2.0, 7.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000308990478515625, -0.00029931217432022095, -0.0002896338701248169, -0.00027995556592941284, -0.0002702772617340088, -0.00026059895753860474, -0.0002509206533432007, -0.00024124234914779663, -0.00023156404495239258, -0.00022188574075698853, -0.00021220743656158447, -0.00020252913236618042, -0.00019285082817077637, -0.00018317252397537231, -0.00017349421977996826, -0.0001638159155845642, -0.00015413761138916016, -0.0001444593071937561, -0.00013478100299835205, -0.000125102698802948, -0.00011542439460754395, -0.00010574609041213989, -9.606778621673584e-05, -8.638948202133179e-05, -7.671117782592773e-05, -6.703287363052368e-05, -5.735456943511963e-05, -4.7676265239715576e-05, -3.7997961044311523e-05, -2.831965684890747e-05, -1.8641352653503418e-05, -8.963048458099365e-06, 7.152557373046875e-07, 1.039355993270874e-05, 2.0071864128112793e-05, 2.9750168323516846e-05, 3.94284725189209e-05, 4.910677671432495e-05, 5.8785080909729004e-05, 6.846338510513306e-05, 7.814168930053711e-05, 8.781999349594116e-05, 9.749829769134521e-05, 0.00010717660188674927, 0.00011685490608215332, 0.00012653321027755737, 0.00013621151447296143, 0.00014588981866836548, 0.00015556812286376953, 0.00016524642705917358, 0.00017492473125457764, 0.0001846030354499817, 0.00019428133964538574, 0.0002039596438407898, 0.00021363794803619385, 0.0002233162522315979, 0.00023299455642700195, 0.000242672860622406, 0.00025235116481781006, 0.0002620294690132141, 0.00027170777320861816, 0.0002813860774040222, 0.00029106438159942627, 0.0003007426857948303, 0.0003104209899902344]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 8.0, 14.0, 11.0, 16.0, 27.0, 37.0, 55.0, 76.0, 96.0, 154.0, 226.0, 318.0, 479.0, 695.0, 1119.0, 1714.0, 2799.0, 4731.0, 8219.0, 15672.0, 32630.0, 88563.0, 645005.0, 152776.0, 46984.0, 20387.0, 10418.0, 5784.0, 3527.0, 2028.0, 1338.0, 855.0, 571.0, 386.0, 253.0, 171.0, 123.0, 87.0, 54.0, 46.0, 28.0, 19.0, 13.0, 16.0, 13.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.59375, -10.269775390625, -9.94580078125, -9.621826171875, -9.2978515625, -8.973876953125, -8.64990234375, -8.325927734375, -8.001953125, -7.677978515625, -7.35400390625, -7.030029296875, -6.7060546875, -6.382080078125, -6.05810546875, -5.734130859375, -5.41015625, -5.086181640625, -4.76220703125, -4.438232421875, -4.1142578125, -3.790283203125, -3.46630859375, -3.142333984375, -2.818359375, -2.494384765625, -2.17041015625, -1.846435546875, -1.5224609375, -1.198486328125, -0.87451171875, -0.550537109375, -0.2265625, 0.097412109375, 0.42138671875, 0.745361328125, 1.0693359375, 1.393310546875, 1.71728515625, 2.041259765625, 2.365234375, 2.689208984375, 3.01318359375, 3.337158203125, 3.6611328125, 3.985107421875, 4.30908203125, 4.633056640625, 4.95703125, 5.281005859375, 5.60498046875, 5.928955078125, 6.2529296875, 6.576904296875, 6.90087890625, 7.224853515625, 7.548828125, 7.872802734375, 8.19677734375, 8.520751953125, 8.8447265625, 9.168701171875, 9.49267578125, 9.816650390625, 10.140625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 2.0, 7.0, 8.0, 9.0, 9.0, 8.0, 17.0, 12.0, 15.0, 26.0, 33.0, 39.0, 51.0, 60.0, 60.0, 270.0, 79.0, 49.0, 50.0, 41.0, 22.0, 23.0, 22.0, 18.0, 19.0, 7.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.56640625, -2.482330322265625, -2.39825439453125, -2.314178466796875, -2.2301025390625, -2.146026611328125, -2.06195068359375, -1.977874755859375, -1.893798828125, -1.809722900390625, -1.72564697265625, -1.641571044921875, -1.5574951171875, -1.473419189453125, -1.38934326171875, -1.305267333984375, -1.22119140625, -1.137115478515625, -1.05303955078125, -0.968963623046875, -0.8848876953125, -0.800811767578125, -0.71673583984375, -0.632659912109375, -0.548583984375, -0.464508056640625, -0.38043212890625, -0.296356201171875, -0.2122802734375, -0.128204345703125, -0.04412841796875, 0.039947509765625, 0.1240234375, 0.208099365234375, 0.29217529296875, 0.376251220703125, 0.4603271484375, 0.544403076171875, 0.62847900390625, 0.712554931640625, 0.796630859375, 0.880706787109375, 0.96478271484375, 1.048858642578125, 1.1329345703125, 1.217010498046875, 1.30108642578125, 1.385162353515625, 1.46923828125, 1.553314208984375, 1.63739013671875, 1.721466064453125, 1.8055419921875, 1.889617919921875, 1.97369384765625, 2.057769775390625, 2.141845703125, 2.225921630859375, 2.30999755859375, 2.394073486328125, 2.4781494140625, 2.562225341796875, 2.64630126953125, 2.730377197265625, 2.814453125]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 6.0, 8.0, 9.0, 14.0, 22.0, 23.0, 32.0, 52.0, 94.0, 118.0, 133.0, 99.0, 87.0, 58.0, 51.0, 39.0, 27.0, 22.0, 14.0, 12.0, 19.0, 7.0, 9.0, 1.0, 4.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.4156270027160645, -6.203339099884033, -5.991051197052002, -5.778763294219971, -5.566475868225098, -5.354187965393066, -5.141900062561035, -4.929612159729004, -4.717324256896973, -4.505036354064941, -4.29274845123291, -4.080460548400879, -3.8681728839874268, -3.6558849811553955, -3.4435973167419434, -3.231309413909912, -3.019021511077881, -2.8067336082458496, -2.5944457054138184, -2.382158041000366, -2.169870138168335, -1.9575822353363037, -1.745294451713562, -1.5330066680908203, -1.320718765258789, -1.1084308624267578, -0.8961430788040161, -0.6838552355766296, -0.47156739234924316, -0.2592794895172119, -0.046991705894470215, 0.16529607772827148, 0.37758350372314453, 0.589871346950531, 0.8021591901779175, 1.0144469738006592, 1.2267348766326904, 1.4390227794647217, 1.6513105630874634, 1.863598346710205, 2.0758862495422363, 2.2881741523742676, 2.500462055206299, 2.712749719619751, 2.9250376224517822, 3.1373255252838135, 3.3496131896972656, 3.561901092529297, 3.774188995361328, 3.9864768981933594, 4.198764801025391, 4.411052703857422, 4.623340606689453, 4.835628509521484, 5.047915935516357, 5.260203838348389, 5.47249174118042, 5.684779644012451, 5.897067546844482, 6.109355449676514, 6.321642875671387, 6.533930778503418, 6.746218681335449, 6.9585065841674805, 7.170794486999512]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 3.0, 9.0, 8.0, 12.0, 9.0, 12.0, 13.0, 17.0, 26.0, 25.0, 22.0, 28.0, 32.0, 31.0, 32.0, 37.0, 27.0, 33.0, 39.0, 45.0, 40.0, 40.0, 40.0, 42.0, 38.0, 30.0, 38.0, 33.0, 18.0, 33.0, 20.0, 14.0, 31.0, 16.0, 19.0, 8.0, 15.0, 13.0, 15.0, 4.0, 7.0, 6.0, 6.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.5071539878845215, -4.365956783294678, -4.224759578704834, -4.08356237411499, -3.9423651695251465, -3.8011679649353027, -3.659970760345459, -3.5187735557556152, -3.3775763511657715, -3.2363791465759277, -3.095181941986084, -2.9539847373962402, -2.8127875328063965, -2.6715903282165527, -2.530393123626709, -2.3891959190368652, -2.2479987144470215, -2.1068015098571777, -1.965604305267334, -1.8244071006774902, -1.6832098960876465, -1.5420126914978027, -1.400815486907959, -1.2596182823181152, -1.1184210777282715, -0.9772238731384277, -0.836026668548584, -0.6948294639587402, -0.5536322593688965, -0.41243505477905273, -0.271237850189209, -0.13004064559936523, 0.011157035827636719, 0.15235424041748047, 0.2935514450073242, 0.43474864959716797, 0.5759458541870117, 0.7171430587768555, 0.8583402633666992, 0.999537467956543, 1.1407346725463867, 1.2819318771362305, 1.4231290817260742, 1.564326286315918, 1.7055234909057617, 1.8467206954956055, 1.9879179000854492, 2.129115104675293, 2.2703123092651367, 2.4115095138549805, 2.552706718444824, 2.693903923034668, 2.8351011276245117, 2.9762983322143555, 3.117495536804199, 3.258692741394043, 3.3998899459838867, 3.5410871505737305, 3.682284355163574, 3.823481559753418, 3.9646787643432617, 4.1058759689331055, 4.247073173522949, 4.388270378112793, 4.529467582702637]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 6.0, 12.0, 9.0, 20.0, 23.0, 43.0, 70.0, 68.0, 122.0, 182.0, 267.0, 368.0, 570.0, 794.0, 1091.0, 1604.0, 2282.0, 3267.0, 4758.0, 6941.0, 10436.0, 16473.0, 26698.0, 45755.0, 85475.0, 190727.0, 670048.0, 2001754.0, 721641.0, 200738.0, 86758.0, 44866.0, 25236.0, 15525.0, 9430.0, 6295.0, 4205.0, 2862.0, 2059.0, 1377.0, 974.0, 718.0, 505.0, 382.0, 241.0, 196.0, 135.0, 77.0, 72.0, 48.0, 29.0, 20.0, 8.0, 12.0, 12.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-6.3203125, -6.1197509765625, -5.919189453125, -5.7186279296875, -5.51806640625, -5.3175048828125, -5.116943359375, -4.9163818359375, -4.7158203125, -4.5152587890625, -4.314697265625, -4.1141357421875, -3.91357421875, -3.7130126953125, -3.512451171875, -3.3118896484375, -3.111328125, -2.9107666015625, -2.710205078125, -2.5096435546875, -2.30908203125, -2.1085205078125, -1.907958984375, -1.7073974609375, -1.5068359375, -1.3062744140625, -1.105712890625, -0.9051513671875, -0.70458984375, -0.5040283203125, -0.303466796875, -0.1029052734375, 0.09765625, 0.2982177734375, 0.498779296875, 0.6993408203125, 0.89990234375, 1.1004638671875, 1.301025390625, 1.5015869140625, 1.7021484375, 1.9027099609375, 2.103271484375, 2.3038330078125, 2.50439453125, 2.7049560546875, 2.905517578125, 3.1060791015625, 3.306640625, 3.5072021484375, 3.707763671875, 3.9083251953125, 4.10888671875, 4.3094482421875, 4.510009765625, 4.7105712890625, 4.9111328125, 5.1116943359375, 5.312255859375, 5.5128173828125, 5.71337890625, 5.9139404296875, 6.114501953125, 6.3150634765625, 6.515625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 8.0, 8.0, 7.0, 12.0, 13.0, 12.0, 16.0, 18.0, 20.0, 23.0, 15.0, 36.0, 24.0, 26.0, 43.0, 28.0, 26.0, 42.0, 34.0, 32.0, 31.0, 39.0, 39.0, 34.0, 37.0, 41.0, 36.0, 39.0, 38.0, 16.0, 20.0, 23.0, 16.0, 25.0, 19.0, 14.0, 13.0, 7.0, 12.0, 10.0, 11.0, 8.0, 6.0, 5.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.490234375, -2.410675048828125, -2.33111572265625, -2.251556396484375, -2.1719970703125, -2.092437744140625, -2.01287841796875, -1.933319091796875, -1.853759765625, -1.774200439453125, -1.69464111328125, -1.615081787109375, -1.5355224609375, -1.455963134765625, -1.37640380859375, -1.296844482421875, -1.21728515625, -1.137725830078125, -1.05816650390625, -0.978607177734375, -0.8990478515625, -0.819488525390625, -0.73992919921875, -0.660369873046875, -0.580810546875, -0.501251220703125, -0.42169189453125, -0.342132568359375, -0.2625732421875, -0.183013916015625, -0.10345458984375, -0.023895263671875, 0.0556640625, 0.135223388671875, 0.21478271484375, 0.294342041015625, 0.3739013671875, 0.453460693359375, 0.53302001953125, 0.612579345703125, 0.692138671875, 0.771697998046875, 0.85125732421875, 0.930816650390625, 1.0103759765625, 1.089935302734375, 1.16949462890625, 1.249053955078125, 1.32861328125, 1.408172607421875, 1.48773193359375, 1.567291259765625, 1.6468505859375, 1.726409912109375, 1.80596923828125, 1.885528564453125, 1.965087890625, 2.044647216796875, 2.12420654296875, 2.203765869140625, 2.2833251953125, 2.362884521484375, 2.44244384765625, 2.522003173828125, 2.6015625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 4.0, 6.0, 3.0, 10.0, 12.0, 14.0, 45.0, 49.0, 75.0, 93.0, 157.0, 211.0, 274.0, 458.0, 622.0, 1001.0, 1529.0, 2395.0, 3939.0, 6479.0, 11379.0, 20291.0, 39462.0, 82857.0, 196933.0, 596789.0, 2000644.0, 789667.0, 240608.0, 97756.0, 45541.0, 23076.0, 12628.0, 7334.0, 4299.0, 2675.0, 1681.0, 1105.0, 701.0, 476.0, 310.0, 206.0, 171.0, 96.0, 68.0, 50.0, 40.0, 30.0, 24.0, 5.0, 7.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.02734375, -5.83038330078125, -5.6334228515625, -5.43646240234375, -5.239501953125, -5.04254150390625, -4.8455810546875, -4.64862060546875, -4.45166015625, -4.25469970703125, -4.0577392578125, -3.86077880859375, -3.663818359375, -3.46685791015625, -3.2698974609375, -3.07293701171875, -2.8759765625, -2.67901611328125, -2.4820556640625, -2.28509521484375, -2.088134765625, -1.89117431640625, -1.6942138671875, -1.49725341796875, -1.30029296875, -1.10333251953125, -0.9063720703125, -0.70941162109375, -0.512451171875, -0.31549072265625, -0.1185302734375, 0.07843017578125, 0.275390625, 0.47235107421875, 0.6693115234375, 0.86627197265625, 1.063232421875, 1.26019287109375, 1.4571533203125, 1.65411376953125, 1.85107421875, 2.04803466796875, 2.2449951171875, 2.44195556640625, 2.638916015625, 2.83587646484375, 3.0328369140625, 3.22979736328125, 3.4267578125, 3.62371826171875, 3.8206787109375, 4.01763916015625, 4.214599609375, 4.41156005859375, 4.6085205078125, 4.80548095703125, 5.00244140625, 5.19940185546875, 5.3963623046875, 5.59332275390625, 5.790283203125, 5.98724365234375, 6.1842041015625, 6.38116455078125, 6.578125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 4.0, 11.0, 15.0, 7.0, 21.0, 22.0, 29.0, 42.0, 45.0, 55.0, 57.0, 82.0, 105.0, 122.0, 140.0, 199.0, 245.0, 241.0, 281.0, 358.0, 314.0, 284.0, 274.0, 213.0, 172.0, 153.0, 104.0, 92.0, 63.0, 61.0, 45.0, 45.0, 29.0, 27.0, 16.0, 17.0, 16.0, 8.0, 12.0, 4.0, 9.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0], "bins": [-1.6708984375, -1.62310791015625, -1.5753173828125, -1.52752685546875, -1.479736328125, -1.43194580078125, -1.3841552734375, -1.33636474609375, -1.28857421875, -1.24078369140625, -1.1929931640625, -1.14520263671875, -1.097412109375, -1.04962158203125, -1.0018310546875, -0.95404052734375, -0.90625, -0.85845947265625, -0.8106689453125, -0.76287841796875, -0.715087890625, -0.66729736328125, -0.6195068359375, -0.57171630859375, -0.52392578125, -0.47613525390625, -0.4283447265625, -0.38055419921875, -0.332763671875, -0.28497314453125, -0.2371826171875, -0.18939208984375, -0.1416015625, -0.09381103515625, -0.0460205078125, 0.00177001953125, 0.049560546875, 0.09735107421875, 0.1451416015625, 0.19293212890625, 0.24072265625, 0.28851318359375, 0.3363037109375, 0.38409423828125, 0.431884765625, 0.47967529296875, 0.5274658203125, 0.57525634765625, 0.623046875, 0.67083740234375, 0.7186279296875, 0.76641845703125, 0.814208984375, 0.86199951171875, 0.9097900390625, 0.95758056640625, 1.00537109375, 1.05316162109375, 1.1009521484375, 1.14874267578125, 1.196533203125, 1.24432373046875, 1.2921142578125, 1.33990478515625, 1.3876953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 6.0, 8.0, 11.0, 4.0, 20.0, 26.0, 32.0, 54.0, 80.0, 130.0, 173.0, 126.0, 84.0, 76.0, 46.0, 27.0, 21.0, 12.0, 16.0, 10.0, 7.0, 8.0, 2.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.866970062255859, -6.6748175621032715, -6.482664585113525, -6.2905120849609375, -6.098359107971191, -5.9062066078186035, -5.714054107666016, -5.5219011306762695, -5.329748630523682, -5.137596130371094, -4.945443153381348, -4.75329065322876, -4.561138153076172, -4.368985176086426, -4.176832675933838, -3.984679937362671, -3.792527198791504, -3.600374460220337, -3.40822172164917, -3.216069221496582, -3.023916482925415, -2.831763744354248, -2.63961124420166, -2.447458505630493, -2.255305767059326, -2.063153028488159, -1.8710004091262817, -1.6788477897644043, -1.4866950511932373, -1.2945423126220703, -1.1023896932601929, -0.9102370738983154, -0.7180843353271484, -0.5259316563606262, -0.333778977394104, -0.1416262984275818, 0.05052638053894043, 0.24267905950546265, 0.43483173847198486, 0.6269843578338623, 0.8191370964050293, 1.0112898349761963, 1.2034424543380737, 1.3955950736999512, 1.5877478122711182, 1.7799005508422852, 1.9720531702041626, 2.16420578956604, 2.356358528137207, 2.548511266708374, 2.740664005279541, 2.932816505432129, 3.124969244003296, 3.317121982574463, 3.509274482727051, 3.7014272212982178, 3.8935799598693848, 4.085732460021973, 4.277885437011719, 4.470037937164307, 4.6621904373168945, 4.854343414306641, 5.0464959144592285, 5.238648414611816, 5.4308013916015625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 8.0, 13.0, 15.0, 11.0, 7.0, 10.0, 15.0, 16.0, 16.0, 27.0, 18.0, 32.0, 24.0, 26.0, 29.0, 39.0, 41.0, 32.0, 36.0, 41.0, 38.0, 35.0, 33.0, 33.0, 33.0, 34.0, 41.0, 39.0, 25.0, 22.0, 25.0, 20.0, 27.0, 20.0, 18.0, 11.0, 19.0, 9.0, 10.0, 6.0, 8.0, 10.0, 6.0, 9.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.241666316986084, -3.148360013961792, -3.0550537109375, -2.961747407913208, -2.868441104888916, -2.775135040283203, -2.681828498840332, -2.588522434234619, -2.495216131210327, -2.401909828186035, -2.308603525161743, -2.215297222137451, -2.121990919113159, -2.028684616088867, -1.9353784322738647, -1.8420722484588623, -1.7487658262252808, -1.6554595232009888, -1.5621532201766968, -1.4688470363616943, -1.3755407333374023, -1.2822344303131104, -1.1889281272888184, -1.0956218242645264, -1.0023155212402344, -0.9090092182159424, -0.8157029747962952, -0.7223966717720032, -0.629090428352356, -0.535784125328064, -0.442477822303772, -0.34917157888412476, -0.25586533546447754, -0.16255906224250793, -0.06925277411937714, 0.024053514003753662, 0.11735978722572327, 0.21066606044769287, 0.30397236347198486, 0.3972786068916321, 0.4905849099159241, 0.5838912129402161, 0.6771974563598633, 0.7705037593841553, 0.8638100624084473, 0.9571163058280945, 1.0504226684570312, 1.1437288522720337, 1.2370351552963257, 1.3303414583206177, 1.4236477613449097, 1.516953945159912, 1.610260248184204, 1.703566551208496, 1.796872854232788, 1.89017915725708, 1.983485460281372, 2.076791763305664, 2.170098066329956, 2.263404369354248, 2.35671067237854, 2.450016975402832, 2.543323040008545, 2.636629343032837, 2.729935646057129]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [9.0, 7.0, 16.0, 13.0, 22.0, 22.0, 38.0, 37.0, 53.0, 70.0, 100.0, 129.0, 186.0, 234.0, 330.0, 428.0, 624.0, 792.0, 1127.0, 1573.0, 2112.0, 2954.0, 4140.0, 5758.0, 8320.0, 12283.0, 18554.0, 29522.0, 50566.0, 94348.0, 185483.0, 268271.0, 156016.0, 79600.0, 44298.0, 26304.0, 16396.0, 11274.0, 7598.0, 5218.0, 3807.0, 2674.0, 1955.0, 1391.0, 1028.0, 729.0, 554.0, 423.0, 310.0, 233.0, 168.0, 122.0, 86.0, 66.0, 47.0, 34.0, 36.0, 26.0, 17.0, 21.0, 10.0, 7.0, 5.0, 2.0], "bins": [-1.58984375, -1.5391693115234375, -1.488494873046875, -1.4378204345703125, -1.38714599609375, -1.3364715576171875, -1.285797119140625, -1.2351226806640625, -1.1844482421875, -1.1337738037109375, -1.083099365234375, -1.0324249267578125, -0.98175048828125, -0.9310760498046875, -0.880401611328125, -0.8297271728515625, -0.779052734375, -0.7283782958984375, -0.677703857421875, -0.6270294189453125, -0.57635498046875, -0.5256805419921875, -0.475006103515625, -0.4243316650390625, -0.3736572265625, -0.3229827880859375, -0.272308349609375, -0.2216339111328125, -0.17095947265625, -0.1202850341796875, -0.069610595703125, -0.0189361572265625, 0.03173828125, 0.0824127197265625, 0.133087158203125, 0.1837615966796875, 0.23443603515625, 0.2851104736328125, 0.335784912109375, 0.3864593505859375, 0.4371337890625, 0.4878082275390625, 0.538482666015625, 0.5891571044921875, 0.63983154296875, 0.6905059814453125, 0.741180419921875, 0.7918548583984375, 0.842529296875, 0.8932037353515625, 0.943878173828125, 0.9945526123046875, 1.04522705078125, 1.0959014892578125, 1.146575927734375, 1.1972503662109375, 1.2479248046875, 1.2985992431640625, 1.349273681640625, 1.3999481201171875, 1.45062255859375, 1.5012969970703125, 1.551971435546875, 1.6026458740234375, 1.6533203125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 12.0, 9.0, 16.0, 10.0, 10.0, 15.0, 20.0, 18.0, 18.0, 26.0, 23.0, 29.0, 38.0, 31.0, 36.0, 30.0, 38.0, 38.0, 51.0, 31.0, 42.0, 26.0, 40.0, 40.0, 42.0, 37.0, 25.0, 29.0, 24.0, 25.0, 27.0, 19.0, 17.0, 19.0, 21.0, 12.0, 8.0, 4.0, 7.0, 7.0, 4.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0], "bins": [-3.462890625, -3.366119384765625, -3.26934814453125, -3.172576904296875, -3.0758056640625, -2.979034423828125, -2.88226318359375, -2.785491943359375, -2.688720703125, -2.591949462890625, -2.49517822265625, -2.398406982421875, -2.3016357421875, -2.204864501953125, -2.10809326171875, -2.011322021484375, -1.91455078125, -1.817779541015625, -1.72100830078125, -1.624237060546875, -1.5274658203125, -1.430694580078125, -1.33392333984375, -1.237152099609375, -1.140380859375, -1.043609619140625, -0.94683837890625, -0.850067138671875, -0.7532958984375, -0.656524658203125, -0.55975341796875, -0.462982177734375, -0.3662109375, -0.269439697265625, -0.17266845703125, -0.075897216796875, 0.0208740234375, 0.117645263671875, 0.21441650390625, 0.311187744140625, 0.407958984375, 0.504730224609375, 0.60150146484375, 0.698272705078125, 0.7950439453125, 0.891815185546875, 0.98858642578125, 1.085357666015625, 1.18212890625, 1.278900146484375, 1.37567138671875, 1.472442626953125, 1.5692138671875, 1.665985107421875, 1.76275634765625, 1.859527587890625, 1.956298828125, 2.053070068359375, 2.14984130859375, 2.246612548828125, 2.3433837890625, 2.440155029296875, 2.53692626953125, 2.633697509765625, 2.73046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [8.0, 2.0, 7.0, 11.0, 9.0, 14.0, 8.0, 19.0, 32.0, 35.0, 65.0, 84.0, 93.0, 135.0, 162.0, 270.0, 308.0, 422.0, 539.0, 755.0, 1028.0, 1464.0, 2071.0, 2956.0, 4623.0, 7361.0, 13810.0, 29817.0, 80953.0, 342408.0, 399477.0, 89302.0, 31989.0, 14911.0, 7852.0, 4783.0, 3110.0, 2074.0, 1461.0, 1039.0, 801.0, 564.0, 429.0, 346.0, 267.0, 187.0, 143.0, 96.0, 83.0, 42.0, 42.0, 32.0, 15.0, 15.0, 15.0, 11.0, 6.0, 3.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.669921875, -2.5810546875, -2.4921875, -2.4033203125, -2.314453125, -2.2255859375, -2.13671875, -2.0478515625, -1.958984375, -1.8701171875, -1.78125, -1.6923828125, -1.603515625, -1.5146484375, -1.42578125, -1.3369140625, -1.248046875, -1.1591796875, -1.0703125, -0.9814453125, -0.892578125, -0.8037109375, -0.71484375, -0.6259765625, -0.537109375, -0.4482421875, -0.359375, -0.2705078125, -0.181640625, -0.0927734375, -0.00390625, 0.0849609375, 0.173828125, 0.2626953125, 0.3515625, 0.4404296875, 0.529296875, 0.6181640625, 0.70703125, 0.7958984375, 0.884765625, 0.9736328125, 1.0625, 1.1513671875, 1.240234375, 1.3291015625, 1.41796875, 1.5068359375, 1.595703125, 1.6845703125, 1.7734375, 1.8623046875, 1.951171875, 2.0400390625, 2.12890625, 2.2177734375, 2.306640625, 2.3955078125, 2.484375, 2.5732421875, 2.662109375, 2.7509765625, 2.83984375, 2.9287109375, 3.017578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 0.0, 1.0, 6.0, 6.0, 8.0, 7.0, 12.0, 15.0, 23.0, 16.0, 14.0, 19.0, 12.0, 24.0, 28.0, 28.0, 28.0, 36.0, 40.0, 38.0, 50.0, 36.0, 35.0, 47.0, 37.0, 49.0, 40.0, 30.0, 36.0, 32.0, 28.0, 30.0, 36.0, 20.0, 22.0, 25.0, 22.0, 16.0, 14.0, 8.0, 9.0, 3.0, 8.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8955078125, -1.8301849365234375, -1.764862060546875, -1.6995391845703125, -1.63421630859375, -1.5688934326171875, -1.503570556640625, -1.4382476806640625, -1.3729248046875, -1.3076019287109375, -1.242279052734375, -1.1769561767578125, -1.11163330078125, -1.0463104248046875, -0.980987548828125, -0.9156646728515625, -0.850341796875, -0.7850189208984375, -0.719696044921875, -0.6543731689453125, -0.58905029296875, -0.5237274169921875, -0.458404541015625, -0.3930816650390625, -0.3277587890625, -0.2624359130859375, -0.197113037109375, -0.1317901611328125, -0.06646728515625, -0.0011444091796875, 0.064178466796875, 0.1295013427734375, 0.19482421875, 0.2601470947265625, 0.325469970703125, 0.3907928466796875, 0.45611572265625, 0.5214385986328125, 0.586761474609375, 0.6520843505859375, 0.7174072265625, 0.7827301025390625, 0.848052978515625, 0.9133758544921875, 0.97869873046875, 1.0440216064453125, 1.109344482421875, 1.1746673583984375, 1.239990234375, 1.3053131103515625, 1.370635986328125, 1.4359588623046875, 1.50128173828125, 1.5666046142578125, 1.631927490234375, 1.6972503662109375, 1.7625732421875, 1.8278961181640625, 1.893218994140625, 1.9585418701171875, 2.02386474609375, 2.0891876220703125, 2.154510498046875, 2.2198333740234375, 2.28515625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 8.0, 13.0, 29.0, 31.0, 43.0, 59.0, 50.0, 88.0, 125.0, 173.0, 317.0, 402.0, 578.0, 844.0, 1368.0, 2392.0, 4190.0, 8525.0, 20641.0, 74589.0, 733592.0, 145993.0, 30341.0, 11175.0, 5175.0, 2937.0, 1684.0, 972.0, 698.0, 455.0, 333.0, 207.0, 140.0, 107.0, 69.0, 70.0, 33.0, 28.0, 17.0, 15.0, 10.0, 7.0, 10.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.73681640625, -0.714935302734375, -0.69305419921875, -0.671173095703125, -0.6492919921875, -0.627410888671875, -0.60552978515625, -0.583648681640625, -0.561767578125, -0.539886474609375, -0.51800537109375, -0.496124267578125, -0.4742431640625, -0.452362060546875, -0.43048095703125, -0.408599853515625, -0.38671875, -0.364837646484375, -0.34295654296875, -0.321075439453125, -0.2991943359375, -0.277313232421875, -0.25543212890625, -0.233551025390625, -0.211669921875, -0.189788818359375, -0.16790771484375, -0.146026611328125, -0.1241455078125, -0.102264404296875, -0.08038330078125, -0.058502197265625, -0.03662109375, -0.014739990234375, 0.00714111328125, 0.029022216796875, 0.0509033203125, 0.072784423828125, 0.09466552734375, 0.116546630859375, 0.138427734375, 0.160308837890625, 0.18218994140625, 0.204071044921875, 0.2259521484375, 0.247833251953125, 0.26971435546875, 0.291595458984375, 0.3134765625, 0.335357666015625, 0.35723876953125, 0.379119873046875, 0.4010009765625, 0.422882080078125, 0.44476318359375, 0.466644287109375, 0.488525390625, 0.510406494140625, 0.53228759765625, 0.554168701171875, 0.5760498046875, 0.597930908203125, 0.61981201171875, 0.641693115234375, 0.66357421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 16.0, 23.0, 29.0, 36.0, 60.0, 101.0, 140.0, 173.0, 138.0, 75.0, 45.0, 47.0, 22.0, 17.0, 13.0, 9.0, 7.0, 7.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.796815872192383e-05, -3.68291512131691e-05, -3.569014370441437e-05, -3.455113619565964e-05, -3.341212868690491e-05, -3.227312117815018e-05, -3.113411366939545e-05, -2.9995106160640717e-05, -2.8856098651885986e-05, -2.7717091143131256e-05, -2.6578083634376526e-05, -2.5439076125621796e-05, -2.4300068616867065e-05, -2.3161061108112335e-05, -2.2022053599357605e-05, -2.0883046090602875e-05, -1.9744038581848145e-05, -1.8605031073093414e-05, -1.7466023564338684e-05, -1.6327016055583954e-05, -1.5188008546829224e-05, -1.4049001038074493e-05, -1.2909993529319763e-05, -1.1770986020565033e-05, -1.0631978511810303e-05, -9.492971003055573e-06, -8.353963494300842e-06, -7.214955985546112e-06, -6.075948476791382e-06, -4.936940968036652e-06, -3.7979334592819214e-06, -2.658925950527191e-06, -1.519918441772461e-06, -3.809109330177307e-07, 7.580965757369995e-07, 1.8971040844917297e-06, 3.03611159324646e-06, 4.17511910200119e-06, 5.31412661075592e-06, 6.453134119510651e-06, 7.592141628265381e-06, 8.731149137020111e-06, 9.870156645774841e-06, 1.1009164154529572e-05, 1.2148171663284302e-05, 1.3287179172039032e-05, 1.4426186680793762e-05, 1.5565194189548492e-05, 1.6704201698303223e-05, 1.7843209207057953e-05, 1.8982216715812683e-05, 2.0121224224567413e-05, 2.1260231733322144e-05, 2.2399239242076874e-05, 2.3538246750831604e-05, 2.4677254259586334e-05, 2.5816261768341064e-05, 2.6955269277095795e-05, 2.8094276785850525e-05, 2.9233284294605255e-05, 3.0372291803359985e-05, 3.1511299312114716e-05, 3.2650306820869446e-05, 3.3789314329624176e-05, 3.4928321838378906e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 7.0, 4.0, 2.0, 18.0, 15.0, 31.0, 43.0, 46.0, 70.0, 97.0, 152.0, 201.0, 278.0, 447.0, 643.0, 1049.0, 1488.0, 2451.0, 3984.0, 6633.0, 11718.0, 22039.0, 47029.0, 139503.0, 549809.0, 156005.0, 50663.0, 23361.0, 12362.0, 7054.0, 4100.0, 2584.0, 1578.0, 999.0, 647.0, 464.0, 294.0, 215.0, 122.0, 125.0, 57.0, 42.0, 32.0, 27.0, 24.0, 11.0, 12.0, 7.0, 6.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.63818359375, -0.6191558837890625, -0.600128173828125, -0.5811004638671875, -0.56207275390625, -0.5430450439453125, -0.524017333984375, -0.5049896240234375, -0.4859619140625, -0.4669342041015625, -0.447906494140625, -0.4288787841796875, -0.40985107421875, -0.3908233642578125, -0.371795654296875, -0.3527679443359375, -0.333740234375, -0.3147125244140625, -0.295684814453125, -0.2766571044921875, -0.25762939453125, -0.2386016845703125, -0.219573974609375, -0.2005462646484375, -0.1815185546875, -0.1624908447265625, -0.143463134765625, -0.1244354248046875, -0.10540771484375, -0.0863800048828125, -0.067352294921875, -0.0483245849609375, -0.029296875, -0.0102691650390625, 0.008758544921875, 0.0277862548828125, 0.04681396484375, 0.0658416748046875, 0.084869384765625, 0.1038970947265625, 0.1229248046875, 0.1419525146484375, 0.160980224609375, 0.1800079345703125, 0.19903564453125, 0.2180633544921875, 0.237091064453125, 0.2561187744140625, 0.275146484375, 0.2941741943359375, 0.313201904296875, 0.3322296142578125, 0.35125732421875, 0.3702850341796875, 0.389312744140625, 0.4083404541015625, 0.4273681640625, 0.4463958740234375, 0.465423583984375, 0.4844512939453125, 0.50347900390625, 0.5225067138671875, 0.541534423828125, 0.5605621337890625, 0.57958984375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 1.0, 5.0, 4.0, 2.0, 7.0, 13.0, 12.0, 8.0, 11.0, 15.0, 12.0, 19.0, 21.0, 28.0, 33.0, 33.0, 63.0, 84.0, 111.0, 97.0, 89.0, 59.0, 54.0, 42.0, 38.0, 21.0, 21.0, 18.0, 17.0, 3.0, 11.0, 10.0, 5.0, 6.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1754150390625, -0.1701030731201172, -0.16479110717773438, -0.15947914123535156, -0.15416717529296875, -0.14885520935058594, -0.14354324340820312, -0.1382312774658203, -0.1329193115234375, -0.1276073455810547, -0.12229537963867188, -0.11698341369628906, -0.11167144775390625, -0.10635948181152344, -0.10104751586914062, -0.09573554992675781, -0.090423583984375, -0.08511161804199219, -0.07979965209960938, -0.07448768615722656, -0.06917572021484375, -0.06386375427246094, -0.058551788330078125, -0.05323982238769531, -0.0479278564453125, -0.04261589050292969, -0.037303924560546875, -0.03199195861816406, -0.02667999267578125, -0.021368026733398438, -0.016056060791015625, -0.010744094848632812, -0.00543212890625, -0.0001201629638671875, 0.005191802978515625, 0.010503768920898438, 0.01581573486328125, 0.021127700805664062, 0.026439666748046875, 0.03175163269042969, 0.0370635986328125, 0.04237556457519531, 0.047687530517578125, 0.05299949645996094, 0.05831146240234375, 0.06362342834472656, 0.06893539428710938, 0.07424736022949219, 0.079559326171875, 0.08487129211425781, 0.09018325805664062, 0.09549522399902344, 0.10080718994140625, 0.10611915588378906, 0.11143112182617188, 0.11674308776855469, 0.1220550537109375, 0.1273670196533203, 0.13267898559570312, 0.13799095153808594, 0.14330291748046875, 0.14861488342285156, 0.15392684936523438, 0.1592388153076172, 0.16455078125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 1.0, 5.0, 11.0, 7.0, 13.0, 17.0, 27.0, 37.0, 54.0, 93.0, 155.0, 158.0, 116.0, 83.0, 68.0, 39.0, 21.0, 19.0, 14.0, 15.0, 11.0, 8.0, 6.0, 2.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.755007743835449, -6.5637431144714355, -6.372478485107422, -6.181213855743408, -5.9899492263793945, -5.798684597015381, -5.607419967651367, -5.416154861450195, -5.22489070892334, -5.033626079559326, -4.8423614501953125, -4.651096820831299, -4.459832191467285, -4.2685675621032715, -4.077302932739258, -3.886038064956665, -3.6947731971740723, -3.5035085678100586, -3.312243938446045, -3.1209793090820312, -2.9297146797180176, -2.738450050354004, -2.547185182571411, -2.3559205532073975, -2.164655923843384, -1.9733912944793701, -1.7821266651153564, -1.5908619165420532, -1.3995972871780396, -1.2083326578140259, -1.0170679092407227, -0.825803279876709, -0.6345386505126953, -0.44327399134635925, -0.2520093321800232, -0.060744643211364746, 0.13051998615264893, 0.3217846155166626, 0.5130493640899658, 0.7043139934539795, 0.8955786228179932, 1.0868432521820068, 1.2781078815460205, 1.4693726301193237, 1.6606372594833374, 1.851901888847351, 2.0431666374206543, 2.234431266784668, 2.4256958961486816, 2.6169605255126953, 2.808225154876709, 2.9994897842407227, 3.1907544136047363, 3.38201904296875, 3.5732839107513428, 3.7645485401153564, 3.95581316947937, 4.147078037261963, 4.338342666625977, 4.52960729598999, 4.720871925354004, 4.912136554718018, 5.103401184082031, 5.294665813446045, 5.485930442810059]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 7.0, 2.0, 5.0, 6.0, 17.0, 14.0, 5.0, 12.0, 7.0, 20.0, 17.0, 14.0, 26.0, 20.0, 28.0, 22.0, 30.0, 31.0, 41.0, 33.0, 41.0, 32.0, 39.0, 38.0, 32.0, 37.0, 31.0, 39.0, 31.0, 40.0, 39.0, 25.0, 21.0, 28.0, 23.0, 20.0, 20.0, 17.0, 16.0, 16.0, 10.0, 10.0, 10.0, 4.0, 10.0, 10.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.2192859649658203, -3.1271839141845703, -3.0350818634033203, -2.9429798126220703, -2.8508777618408203, -2.7587757110595703, -2.6666736602783203, -2.5745716094970703, -2.4824695587158203, -2.3903675079345703, -2.2982654571533203, -2.2061634063720703, -2.1140613555908203, -2.0219593048095703, -1.9298571348190308, -1.8377550840377808, -1.7456529140472412, -1.6535508632659912, -1.5614488124847412, -1.4693467617034912, -1.3772447109222412, -1.2851426601409912, -1.1930404901504517, -1.1009384393692017, -1.0088363885879517, -0.9167343378067017, -0.8246322870254517, -0.7325301766395569, -0.6404281258583069, -0.5483260750770569, -0.4562239646911621, -0.3641219139099121, -0.2720198631286621, -0.17991779744625092, -0.08781573176383972, 0.004286348819732666, 0.09638839960098267, 0.18849045038223267, 0.28059256076812744, 0.37269461154937744, 0.46479666233062744, 0.5568987131118774, 0.6490007638931274, 0.7411028742790222, 0.8332049250602722, 0.9253069758415222, 1.017409086227417, 1.109511137008667, 1.201613187789917, 1.293715238571167, 1.385817289352417, 1.477919340133667, 1.570021390914917, 1.662123441696167, 1.7542256116867065, 1.8463276624679565, 1.9384297132492065, 2.030531883239746, 2.122633934020996, 2.214735984802246, 2.306838035583496, 2.398940086364746, 2.491042137145996, 2.583144187927246, 2.675246238708496]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 9.0, 12.0, 12.0, 12.0, 17.0, 27.0, 39.0, 69.0, 89.0, 120.0, 165.0, 271.0, 375.0, 552.0, 823.0, 1236.0, 1931.0, 3039.0, 4555.0, 7942.0, 13532.0, 24182.0, 44544.0, 84916.0, 169189.0, 278319.0, 196187.0, 98307.0, 51288.0, 27516.0, 15440.0, 8817.0, 5301.0, 3402.0, 2218.0, 1321.0, 854.0, 578.0, 408.0, 268.0, 191.0, 144.0, 96.0, 80.0, 53.0, 37.0, 28.0, 19.0, 17.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.81982421875, -4.6513671875, -4.48291015625, -4.314453125, -4.14599609375, -3.9775390625, -3.80908203125, -3.640625, -3.47216796875, -3.3037109375, -3.13525390625, -2.966796875, -2.79833984375, -2.6298828125, -2.46142578125, -2.29296875, -2.12451171875, -1.9560546875, -1.78759765625, -1.619140625, -1.45068359375, -1.2822265625, -1.11376953125, -0.9453125, -0.77685546875, -0.6083984375, -0.43994140625, -0.271484375, -0.10302734375, 0.0654296875, 0.23388671875, 0.40234375, 0.57080078125, 0.7392578125, 0.90771484375, 1.076171875, 1.24462890625, 1.4130859375, 1.58154296875, 1.75, 1.91845703125, 2.0869140625, 2.25537109375, 2.423828125, 2.59228515625, 2.7607421875, 2.92919921875, 3.09765625, 3.26611328125, 3.4345703125, 3.60302734375, 3.771484375, 3.93994140625, 4.1083984375, 4.27685546875, 4.4453125, 4.61376953125, 4.7822265625, 4.95068359375, 5.119140625, 5.28759765625, 5.4560546875, 5.62451171875, 5.79296875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 2.0, 3.0, 9.0, 11.0, 10.0, 7.0, 8.0, 11.0, 19.0, 8.0, 14.0, 20.0, 28.0, 28.0, 21.0, 30.0, 33.0, 42.0, 28.0, 39.0, 30.0, 43.0, 31.0, 37.0, 43.0, 30.0, 37.0, 39.0, 38.0, 30.0, 24.0, 28.0, 31.0, 20.0, 29.0, 9.0, 21.0, 16.0, 15.0, 18.0, 15.0, 10.0, 9.0, 8.0, 5.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-2.67578125, -2.5987548828125, -2.521728515625, -2.4447021484375, -2.36767578125, -2.2906494140625, -2.213623046875, -2.1365966796875, -2.0595703125, -1.9825439453125, -1.905517578125, -1.8284912109375, -1.75146484375, -1.6744384765625, -1.597412109375, -1.5203857421875, -1.443359375, -1.3663330078125, -1.289306640625, -1.2122802734375, -1.13525390625, -1.0582275390625, -0.981201171875, -0.9041748046875, -0.8271484375, -0.7501220703125, -0.673095703125, -0.5960693359375, -0.51904296875, -0.4420166015625, -0.364990234375, -0.2879638671875, -0.2109375, -0.1339111328125, -0.056884765625, 0.0201416015625, 0.09716796875, 0.1741943359375, 0.251220703125, 0.3282470703125, 0.4052734375, 0.4822998046875, 0.559326171875, 0.6363525390625, 0.71337890625, 0.7904052734375, 0.867431640625, 0.9444580078125, 1.021484375, 1.0985107421875, 1.175537109375, 1.2525634765625, 1.32958984375, 1.4066162109375, 1.483642578125, 1.5606689453125, 1.6376953125, 1.7147216796875, 1.791748046875, 1.8687744140625, 1.94580078125, 2.0228271484375, 2.099853515625, 2.1768798828125, 2.25390625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 17.0, 16.0, 26.0, 51.0, 63.0, 85.0, 110.0, 185.0, 248.0, 382.0, 511.0, 874.0, 1331.0, 2307.0, 3821.0, 6836.0, 11800.0, 21547.0, 41318.0, 82433.0, 163695.0, 272877.0, 211353.0, 108568.0, 54569.0, 27906.0, 14957.0, 8201.0, 4797.0, 2763.0, 1749.0, 1093.0, 652.0, 417.0, 331.0, 195.0, 136.0, 96.0, 81.0, 45.0, 29.0, 26.0, 9.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.98046875, -4.8182373046875, -4.656005859375, -4.4937744140625, -4.33154296875, -4.1693115234375, -4.007080078125, -3.8448486328125, -3.6826171875, -3.5203857421875, -3.358154296875, -3.1959228515625, -3.03369140625, -2.8714599609375, -2.709228515625, -2.5469970703125, -2.384765625, -2.2225341796875, -2.060302734375, -1.8980712890625, -1.73583984375, -1.5736083984375, -1.411376953125, -1.2491455078125, -1.0869140625, -0.9246826171875, -0.762451171875, -0.6002197265625, -0.43798828125, -0.2757568359375, -0.113525390625, 0.0487060546875, 0.2109375, 0.3731689453125, 0.535400390625, 0.6976318359375, 0.85986328125, 1.0220947265625, 1.184326171875, 1.3465576171875, 1.5087890625, 1.6710205078125, 1.833251953125, 1.9954833984375, 2.15771484375, 2.3199462890625, 2.482177734375, 2.6444091796875, 2.806640625, 2.9688720703125, 3.131103515625, 3.2933349609375, 3.45556640625, 3.6177978515625, 3.780029296875, 3.9422607421875, 4.1044921875, 4.2667236328125, 4.428955078125, 4.5911865234375, 4.75341796875, 4.9156494140625, 5.077880859375, 5.2401123046875, 5.40234375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 7.0, 9.0, 13.0, 12.0, 15.0, 16.0, 20.0, 23.0, 22.0, 42.0, 41.0, 36.0, 33.0, 31.0, 36.0, 32.0, 39.0, 44.0, 36.0, 42.0, 43.0, 50.0, 32.0, 34.0, 26.0, 36.0, 25.0, 24.0, 29.0, 13.0, 28.0, 16.0, 22.0, 13.0, 8.0, 2.0, 8.0, 5.0, 9.0, 2.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7421875, -1.6858062744140625, -1.629425048828125, -1.5730438232421875, -1.51666259765625, -1.4602813720703125, -1.403900146484375, -1.3475189208984375, -1.2911376953125, -1.2347564697265625, -1.178375244140625, -1.1219940185546875, -1.06561279296875, -1.0092315673828125, -0.952850341796875, -0.8964691162109375, -0.840087890625, -0.7837066650390625, -0.727325439453125, -0.6709442138671875, -0.61456298828125, -0.5581817626953125, -0.501800537109375, -0.4454193115234375, -0.3890380859375, -0.3326568603515625, -0.276275634765625, -0.2198944091796875, -0.16351318359375, -0.1071319580078125, -0.050750732421875, 0.0056304931640625, 0.06201171875, 0.1183929443359375, 0.174774169921875, 0.2311553955078125, 0.28753662109375, 0.3439178466796875, 0.400299072265625, 0.4566802978515625, 0.5130615234375, 0.5694427490234375, 0.625823974609375, 0.6822052001953125, 0.73858642578125, 0.7949676513671875, 0.851348876953125, 0.9077301025390625, 0.964111328125, 1.0204925537109375, 1.076873779296875, 1.1332550048828125, 1.18963623046875, 1.2460174560546875, 1.302398681640625, 1.3587799072265625, 1.4151611328125, 1.4715423583984375, 1.527923583984375, 1.5843048095703125, 1.64068603515625, 1.6970672607421875, 1.753448486328125, 1.8098297119140625, 1.8662109375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [4.0, 5.0, 5.0, 2.0, 5.0, 4.0, 11.0, 16.0, 13.0, 22.0, 31.0, 37.0, 38.0, 68.0, 83.0, 140.0, 181.0, 278.0, 387.0, 439.0, 739.0, 1068.0, 1641.0, 2694.0, 4312.0, 7382.0, 13625.0, 26909.0, 61681.0, 243344.0, 551219.0, 67736.0, 29456.0, 14407.0, 7893.0, 4540.0, 2711.0, 1702.0, 1157.0, 707.0, 562.0, 346.0, 224.0, 237.0, 116.0, 117.0, 70.0, 45.0, 41.0, 26.0, 28.0, 22.0, 9.0, 9.0, 10.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-4.7578125, -4.5994873046875, -4.441162109375, -4.2828369140625, -4.12451171875, -3.9661865234375, -3.807861328125, -3.6495361328125, -3.4912109375, -3.3328857421875, -3.174560546875, -3.0162353515625, -2.85791015625, -2.6995849609375, -2.541259765625, -2.3829345703125, -2.224609375, -2.0662841796875, -1.907958984375, -1.7496337890625, -1.59130859375, -1.4329833984375, -1.274658203125, -1.1163330078125, -0.9580078125, -0.7996826171875, -0.641357421875, -0.4830322265625, -0.32470703125, -0.1663818359375, -0.008056640625, 0.1502685546875, 0.30859375, 0.4669189453125, 0.625244140625, 0.7835693359375, 0.94189453125, 1.1002197265625, 1.258544921875, 1.4168701171875, 1.5751953125, 1.7335205078125, 1.891845703125, 2.0501708984375, 2.20849609375, 2.3668212890625, 2.525146484375, 2.6834716796875, 2.841796875, 3.0001220703125, 3.158447265625, 3.3167724609375, 3.47509765625, 3.6334228515625, 3.791748046875, 3.9500732421875, 4.1083984375, 4.2667236328125, 4.425048828125, 4.5833740234375, 4.74169921875, 4.9000244140625, 5.058349609375, 5.2166748046875, 5.375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 2.0, 12.0, 8.0, 16.0, 23.0, 25.0, 43.0, 77.0, 187.0, 324.0, 96.0, 58.0, 41.0, 22.0, 18.0, 12.0, 7.0, 7.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002684593200683594, -0.0002612471580505371, -0.00025403499603271484, -0.0002468228340148926, -0.0002396106719970703, -0.00023239850997924805, -0.00022518634796142578, -0.00021797418594360352, -0.00021076202392578125, -0.00020354986190795898, -0.00019633769989013672, -0.00018912553787231445, -0.0001819133758544922, -0.00017470121383666992, -0.00016748905181884766, -0.0001602768898010254, -0.00015306472778320312, -0.00014585256576538086, -0.0001386404037475586, -0.00013142824172973633, -0.00012421607971191406, -0.0001170039176940918, -0.00010979175567626953, -0.00010257959365844727, -9.5367431640625e-05, -8.815526962280273e-05, -8.094310760498047e-05, -7.37309455871582e-05, -6.651878356933594e-05, -5.930662155151367e-05, -5.2094459533691406e-05, -4.488229751586914e-05, -3.7670135498046875e-05, -3.045797348022461e-05, -2.3245811462402344e-05, -1.6033649444580078e-05, -8.821487426757812e-06, -1.6093254089355469e-06, 5.602836608886719e-06, 1.2814998626708984e-05, 2.002716064453125e-05, 2.7239322662353516e-05, 3.445148468017578e-05, 4.166364669799805e-05, 4.887580871582031e-05, 5.608797073364258e-05, 6.330013275146484e-05, 7.051229476928711e-05, 7.772445678710938e-05, 8.493661880493164e-05, 9.21487808227539e-05, 9.936094284057617e-05, 0.00010657310485839844, 0.0001137852668762207, 0.00012099742889404297, 0.00012820959091186523, 0.0001354217529296875, 0.00014263391494750977, 0.00014984607696533203, 0.0001570582389831543, 0.00016427040100097656, 0.00017148256301879883, 0.0001786947250366211, 0.00018590688705444336, 0.00019311904907226562]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 10.0, 3.0, 10.0, 15.0, 20.0, 19.0, 41.0, 58.0, 84.0, 130.0, 207.0, 312.0, 511.0, 874.0, 1497.0, 2643.0, 4930.0, 10099.0, 23506.0, 68164.0, 686138.0, 174036.0, 42584.0, 16307.0, 7434.0, 3753.0, 2071.0, 1152.0, 719.0, 412.0, 274.0, 194.0, 118.0, 79.0, 44.0, 36.0, 29.0, 16.0, 9.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5, -6.2889404296875, -6.077880859375, -5.8668212890625, -5.65576171875, -5.4447021484375, -5.233642578125, -5.0225830078125, -4.8115234375, -4.6004638671875, -4.389404296875, -4.1783447265625, -3.96728515625, -3.7562255859375, -3.545166015625, -3.3341064453125, -3.123046875, -2.9119873046875, -2.700927734375, -2.4898681640625, -2.27880859375, -2.0677490234375, -1.856689453125, -1.6456298828125, -1.4345703125, -1.2235107421875, -1.012451171875, -0.8013916015625, -0.59033203125, -0.3792724609375, -0.168212890625, 0.0428466796875, 0.25390625, 0.4649658203125, 0.676025390625, 0.8870849609375, 1.09814453125, 1.3092041015625, 1.520263671875, 1.7313232421875, 1.9423828125, 2.1534423828125, 2.364501953125, 2.5755615234375, 2.78662109375, 2.9976806640625, 3.208740234375, 3.4197998046875, 3.630859375, 3.8419189453125, 4.052978515625, 4.2640380859375, 4.47509765625, 4.6861572265625, 4.897216796875, 5.1082763671875, 5.3193359375, 5.5303955078125, 5.741455078125, 5.9525146484375, 6.16357421875, 6.3746337890625, 6.585693359375, 6.7967529296875, 7.0078125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 8.0, 18.0, 17.0, 22.0, 27.0, 38.0, 55.0, 48.0, 96.0, 307.0, 81.0, 48.0, 32.0, 37.0, 23.0, 22.0, 15.0, 17.0, 13.0, 10.0, 5.0, 4.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.7050933837890625, -1.659210205078125, -1.6133270263671875, -1.56744384765625, -1.5215606689453125, -1.475677490234375, -1.4297943115234375, -1.3839111328125, -1.3380279541015625, -1.292144775390625, -1.2462615966796875, -1.20037841796875, -1.1544952392578125, -1.108612060546875, -1.0627288818359375, -1.016845703125, -0.9709625244140625, -0.925079345703125, -0.8791961669921875, -0.83331298828125, -0.7874298095703125, -0.741546630859375, -0.6956634521484375, -0.6497802734375, -0.6038970947265625, -0.558013916015625, -0.5121307373046875, -0.46624755859375, -0.4203643798828125, -0.374481201171875, -0.3285980224609375, -0.28271484375, -0.2368316650390625, -0.190948486328125, -0.1450653076171875, -0.09918212890625, -0.0532989501953125, -0.007415771484375, 0.0384674072265625, 0.0843505859375, 0.1302337646484375, 0.176116943359375, 0.2220001220703125, 0.26788330078125, 0.3137664794921875, 0.359649658203125, 0.4055328369140625, 0.451416015625, 0.4972991943359375, 0.543182373046875, 0.5890655517578125, 0.63494873046875, 0.6808319091796875, 0.726715087890625, 0.7725982666015625, 0.8184814453125, 0.8643646240234375, 0.910247802734375, 0.9561309814453125, 1.00201416015625, 1.0478973388671875, 1.093780517578125, 1.1396636962890625, 1.185546875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 6.0, 8.0, 15.0, 17.0, 23.0, 42.0, 56.0, 77.0, 121.0, 140.0, 111.0, 75.0, 70.0, 50.0, 41.0, 32.0, 29.0, 21.0, 13.0, 10.0, 4.0, 8.0, 10.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.094003200531006, -4.946249008178711, -4.798494815826416, -4.650740623474121, -4.502986431121826, -4.355232238769531, -4.2074785232543945, -4.0597243309021, -3.9119701385498047, -3.7642159461975098, -3.616461753845215, -3.46870756149292, -3.320953607559204, -3.173199415206909, -3.0254452228546143, -2.8776912689208984, -2.7299368381500244, -2.5821826457977295, -2.4344284534454346, -2.2866744995117188, -2.138920307159424, -1.991166114807129, -1.843411922454834, -1.6956578493118286, -1.5479036569595337, -1.4001494646072388, -1.2523953914642334, -1.1046411991119385, -0.9568870663642883, -0.8091329336166382, -0.6613787412643433, -0.5136246681213379, -0.36587047576904297, -0.21811632812023163, -0.07036218047142029, 0.07739198207855225, 0.2251461148262024, 0.37290024757385254, 0.5206544399261475, 0.6684085130691528, 0.8161627054214478, 0.9639168381690979, 1.111670970916748, 1.259425163269043, 1.407179355621338, 1.5549334287643433, 1.7026876211166382, 1.8504416942596436, 1.9981958866119385, 2.1459500789642334, 2.2937042713165283, 2.441458225250244, 2.589212417602539, 2.736966609954834, 2.884720802307129, 3.032474994659424, 3.1802291870117188, 3.3279833793640137, 3.4757375717163086, 3.6234917640686035, 3.7712457180023193, 3.9189999103546143, 4.066754341125488, 4.214508056640625, 4.36226224899292]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 4.0, 2.0, 4.0, 8.0, 9.0, 10.0, 16.0, 17.0, 9.0, 18.0, 17.0, 10.0, 22.0, 24.0, 26.0, 23.0, 26.0, 33.0, 25.0, 46.0, 32.0, 41.0, 34.0, 50.0, 28.0, 35.0, 34.0, 36.0, 39.0, 33.0, 35.0, 28.0, 28.0, 29.0, 27.0, 20.0, 21.0, 14.0, 16.0, 14.0, 5.0, 14.0, 9.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.9376089572906494, -2.8508334159851074, -2.7640576362609863, -2.6772820949554443, -2.5905065536499023, -2.5037310123443604, -2.4169552326202393, -2.3301796913146973, -2.2434041500091553, -2.1566286087036133, -2.069852828979492, -1.9830772876739502, -1.8963017463684082, -1.8095260858535767, -1.7227504253387451, -1.6359748840332031, -1.5491992235183716, -1.46242356300354, -1.375648021697998, -1.2888723611831665, -1.2020968198776245, -1.115321159362793, -1.028545618057251, -0.9417699575424194, -0.8549943566322327, -0.7682187557220459, -0.6814431548118591, -0.5946675539016724, -0.5078918933868408, -0.42111632227897644, -0.3343406915664673, -0.24756509065628052, -0.16078948974609375, -0.07401388138532639, 0.012761726975440979, 0.09953734278678894, 0.1863129436969757, 0.2730885446071625, 0.35986417531967163, 0.4466397762298584, 0.5334153771400452, 0.6201909780502319, 0.7069665789604187, 0.7937421798706055, 0.880517840385437, 0.967293381690979, 1.0540690422058105, 1.1408445835113525, 1.227620244026184, 1.3143959045410156, 1.4011714458465576, 1.4879471063613892, 1.5747226476669312, 1.6614983081817627, 1.7482738494873047, 1.8350495100021362, 1.9218251705169678, 2.0086007118225098, 2.095376491546631, 2.182152032852173, 2.268927574157715, 2.355703115463257, 2.442478895187378, 2.52925443649292, 2.616029977798462]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 14.0, 24.0, 29.0, 36.0, 59.0, 96.0, 138.0, 222.0, 303.0, 491.0, 801.0, 1214.0, 1940.0, 2922.0, 4923.0, 8435.0, 13707.0, 24150.0, 45245.0, 89715.0, 213738.0, 852698.0, 2074142.0, 537715.0, 161142.0, 72322.0, 36937.0, 20316.0, 12056.0, 6983.0, 4376.0, 2601.0, 1714.0, 1099.0, 703.0, 467.0, 299.0, 181.0, 107.0, 74.0, 52.0, 35.0, 22.0, 8.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.16015625, -5.01422119140625, -4.8682861328125, -4.72235107421875, -4.576416015625, -4.43048095703125, -4.2845458984375, -4.13861083984375, -3.99267578125, -3.84674072265625, -3.7008056640625, -3.55487060546875, -3.408935546875, -3.26300048828125, -3.1170654296875, -2.97113037109375, -2.8251953125, -2.67926025390625, -2.5333251953125, -2.38739013671875, -2.241455078125, -2.09552001953125, -1.9495849609375, -1.80364990234375, -1.65771484375, -1.51177978515625, -1.3658447265625, -1.21990966796875, -1.073974609375, -0.92803955078125, -0.7821044921875, -0.63616943359375, -0.490234375, -0.34429931640625, -0.1983642578125, -0.05242919921875, 0.093505859375, 0.23944091796875, 0.3853759765625, 0.53131103515625, 0.67724609375, 0.82318115234375, 0.9691162109375, 1.11505126953125, 1.260986328125, 1.40692138671875, 1.5528564453125, 1.69879150390625, 1.8447265625, 1.99066162109375, 2.1365966796875, 2.28253173828125, 2.428466796875, 2.57440185546875, 2.7203369140625, 2.86627197265625, 3.01220703125, 3.15814208984375, 3.3040771484375, 3.45001220703125, 3.595947265625, 3.74188232421875, 3.8878173828125, 4.03375244140625, 4.1796875]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 7.0, 14.0, 9.0, 9.0, 16.0, 15.0, 15.0, 24.0, 19.0, 25.0, 25.0, 33.0, 20.0, 31.0, 34.0, 39.0, 36.0, 39.0, 56.0, 39.0, 34.0, 28.0, 35.0, 42.0, 44.0, 31.0, 36.0, 22.0, 20.0, 25.0, 28.0, 26.0, 22.0, 16.0, 9.0, 12.0, 11.0, 6.0, 7.0, 5.0, 7.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-1.9130859375, -1.8575897216796875, -1.802093505859375, -1.7465972900390625, -1.69110107421875, -1.6356048583984375, -1.580108642578125, -1.5246124267578125, -1.4691162109375, -1.4136199951171875, -1.358123779296875, -1.3026275634765625, -1.24713134765625, -1.1916351318359375, -1.136138916015625, -1.0806427001953125, -1.025146484375, -0.9696502685546875, -0.914154052734375, -0.8586578369140625, -0.80316162109375, -0.7476654052734375, -0.692169189453125, -0.6366729736328125, -0.5811767578125, -0.5256805419921875, -0.470184326171875, -0.4146881103515625, -0.35919189453125, -0.3036956787109375, -0.248199462890625, -0.1927032470703125, -0.13720703125, -0.0817108154296875, -0.026214599609375, 0.0292816162109375, 0.08477783203125, 0.1402740478515625, 0.195770263671875, 0.2512664794921875, 0.3067626953125, 0.3622589111328125, 0.417755126953125, 0.4732513427734375, 0.52874755859375, 0.5842437744140625, 0.639739990234375, 0.6952362060546875, 0.750732421875, 0.8062286376953125, 0.861724853515625, 0.9172210693359375, 0.97271728515625, 1.0282135009765625, 1.083709716796875, 1.1392059326171875, 1.1947021484375, 1.2501983642578125, 1.305694580078125, 1.3611907958984375, 1.41668701171875, 1.4721832275390625, 1.527679443359375, 1.5831756591796875, 1.638671875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 10.0, 15.0, 19.0, 27.0, 45.0, 63.0, 82.0, 173.0, 262.0, 467.0, 797.0, 1433.0, 2661.0, 4881.0, 9573.0, 19983.0, 43893.0, 106204.0, 310404.0, 1353287.0, 1743757.0, 376745.0, 124324.0, 49999.0, 22487.0, 10645.0, 5400.0, 2887.0, 1585.0, 882.0, 495.0, 298.0, 175.0, 124.0, 77.0, 46.0, 20.0, 15.0, 15.0, 11.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.46368408203125, -4.3101806640625, -4.15667724609375, -4.003173828125, -3.84967041015625, -3.6961669921875, -3.54266357421875, -3.38916015625, -3.23565673828125, -3.0821533203125, -2.92864990234375, -2.775146484375, -2.62164306640625, -2.4681396484375, -2.31463623046875, -2.1611328125, -2.00762939453125, -1.8541259765625, -1.70062255859375, -1.547119140625, -1.39361572265625, -1.2401123046875, -1.08660888671875, -0.93310546875, -0.77960205078125, -0.6260986328125, -0.47259521484375, -0.319091796875, -0.16558837890625, -0.0120849609375, 0.14141845703125, 0.294921875, 0.44842529296875, 0.6019287109375, 0.75543212890625, 0.908935546875, 1.06243896484375, 1.2159423828125, 1.36944580078125, 1.52294921875, 1.67645263671875, 1.8299560546875, 1.98345947265625, 2.136962890625, 2.29046630859375, 2.4439697265625, 2.59747314453125, 2.7509765625, 2.90447998046875, 3.0579833984375, 3.21148681640625, 3.364990234375, 3.51849365234375, 3.6719970703125, 3.82550048828125, 3.97900390625, 4.13250732421875, 4.2860107421875, 4.43951416015625, 4.593017578125, 4.74652099609375, 4.9000244140625, 5.05352783203125, 5.20703125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 7.0, 13.0, 11.0, 12.0, 18.0, 26.0, 30.0, 35.0, 51.0, 55.0, 87.0, 82.0, 105.0, 131.0, 191.0, 220.0, 256.0, 304.0, 334.0, 358.0, 305.0, 260.0, 217.0, 177.0, 152.0, 122.0, 105.0, 82.0, 75.0, 56.0, 44.0, 27.0, 24.0, 30.0, 16.0, 17.0, 11.0, 5.0, 7.0, 2.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.92138671875, -0.8879928588867188, -0.8545989990234375, -0.8212051391601562, -0.787811279296875, -0.7544174194335938, -0.7210235595703125, -0.6876296997070312, -0.65423583984375, -0.6208419799804688, -0.5874481201171875, -0.5540542602539062, -0.520660400390625, -0.48726654052734375, -0.4538726806640625, -0.42047882080078125, -0.3870849609375, -0.35369110107421875, -0.3202972412109375, -0.28690338134765625, -0.253509521484375, -0.22011566162109375, -0.1867218017578125, -0.15332794189453125, -0.11993408203125, -0.08654022216796875, -0.0531463623046875, -0.01975250244140625, 0.013641357421875, 0.04703521728515625, 0.0804290771484375, 0.11382293701171875, 0.147216796875, 0.18061065673828125, 0.2140045166015625, 0.24739837646484375, 0.280792236328125, 0.31418609619140625, 0.3475799560546875, 0.38097381591796875, 0.41436767578125, 0.44776153564453125, 0.4811553955078125, 0.5145492553710938, 0.547943115234375, 0.5813369750976562, 0.6147308349609375, 0.6481246948242188, 0.6815185546875, 0.7149124145507812, 0.7483062744140625, 0.7817001342773438, 0.815093994140625, 0.8484878540039062, 0.8818817138671875, 0.9152755737304688, 0.94866943359375, 0.9820632934570312, 1.0154571533203125, 1.0488510131835938, 1.082244873046875, 1.1156387329101562, 1.1490325927734375, 1.1824264526367188, 1.2158203125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 6.0, 4.0, 8.0, 9.0, 19.0, 18.0, 28.0, 47.0, 71.0, 97.0, 137.0, 160.0, 95.0, 84.0, 50.0, 45.0, 29.0, 21.0, 24.0, 11.0, 17.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-5.625235557556152, -5.501216888427734, -5.377198696136475, -5.253180027008057, -5.129161357879639, -5.005143165588379, -4.881124496459961, -4.757105827331543, -4.633087635040283, -4.509068965911865, -4.3850507736206055, -4.2610321044921875, -4.1370134353637695, -4.01299524307251, -3.888976573944092, -3.764958143234253, -3.640939474105835, -3.516921043395996, -3.392902374267578, -3.2688839435577393, -3.1448655128479004, -3.0208468437194824, -2.8968284130096436, -2.7728099822998047, -2.6487913131713867, -2.524772882461548, -2.40075421333313, -2.276735782623291, -2.152717351913452, -2.0286989212036133, -1.9046802520751953, -1.7806618213653564, -1.6566436290740967, -1.5326250791549683, -1.4086066484451294, -1.284588098526001, -1.160569667816162, -1.0365511178970337, -0.9125325679779053, -0.7885140776634216, -0.664495587348938, -0.5404770970344543, -0.4164585769176483, -0.2924400568008423, -0.16842156648635864, -0.044403076171875, 0.07961547374725342, 0.20363396406173706, 0.3276524543762207, 0.45167094469070435, 0.575689435005188, 0.6997079849243164, 0.8237264752388, 0.9477449655532837, 1.071763515472412, 1.195781946182251, 1.3198004961013794, 1.4438190460205078, 1.5678374767303467, 1.691856026649475, 1.8158745765686035, 1.9398930072784424, 2.0639114379882812, 2.187930107116699, 2.311948537826538]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 4.0, 9.0, 7.0, 13.0, 10.0, 15.0, 13.0, 11.0, 13.0, 22.0, 20.0, 25.0, 26.0, 23.0, 26.0, 35.0, 30.0, 35.0, 38.0, 44.0, 41.0, 36.0, 40.0, 39.0, 41.0, 32.0, 24.0, 33.0, 33.0, 32.0, 35.0, 31.0, 27.0, 22.0, 16.0, 14.0, 15.0, 12.0, 10.0, 7.0, 3.0, 7.0, 7.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.033118724822998, -1.9688342809677124, -1.9045498371124268, -1.8402655124664307, -1.775981068611145, -1.7116966247558594, -1.6474123001098633, -1.5831278562545776, -1.518843412399292, -1.4545589685440063, -1.3902745246887207, -1.3259902000427246, -1.261705756187439, -1.1974213123321533, -1.1331369876861572, -1.0688525438308716, -1.004568099975586, -0.9402836561203003, -0.8759992718696594, -0.8117148876190186, -0.7474304437637329, -0.6831459999084473, -0.6188616156578064, -0.5545772314071655, -0.4902927875518799, -0.4260083734989166, -0.36172395944595337, -0.2974395453929901, -0.23315513134002686, -0.1688707172870636, -0.10458630323410034, -0.040301889181137085, 0.023982524871826172, 0.08826693892478943, 0.15255135297775269, 0.21683576703071594, 0.2811201810836792, 0.34540459513664246, 0.4096890091896057, 0.47397342324256897, 0.5382578372955322, 0.6025422811508179, 0.6668266654014587, 0.7311110496520996, 0.7953954935073853, 0.8596799373626709, 0.9239643216133118, 0.9882487058639526, 1.0525331497192383, 1.116817593574524, 1.1811020374298096, 1.2453863620758057, 1.3096708059310913, 1.373955249786377, 1.438239574432373, 1.5025240182876587, 1.5668084621429443, 1.63109290599823, 1.6953773498535156, 1.7596616744995117, 1.8239461183547974, 1.888230562210083, 1.952514886856079, 2.0167994499206543, 2.0810837745666504]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 13.0, 21.0, 35.0, 47.0, 60.0, 86.0, 130.0, 200.0, 226.0, 348.0, 482.0, 695.0, 973.0, 1473.0, 2215.0, 3538.0, 5604.0, 9290.0, 16521.0, 30973.0, 64943.0, 154121.0, 363416.0, 217360.0, 85688.0, 39437.0, 20659.0, 11131.0, 6638.0, 4137.0, 2591.0, 1732.0, 1140.0, 764.0, 581.0, 369.0, 257.0, 193.0, 130.0, 101.0, 69.0, 42.0, 42.0, 23.0, 18.0, 11.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0], "bins": [-1.494140625, -1.4484100341796875, -1.402679443359375, -1.3569488525390625, -1.31121826171875, -1.2654876708984375, -1.219757080078125, -1.1740264892578125, -1.1282958984375, -1.0825653076171875, -1.036834716796875, -0.9911041259765625, -0.94537353515625, -0.8996429443359375, -0.853912353515625, -0.8081817626953125, -0.762451171875, -0.7167205810546875, -0.670989990234375, -0.6252593994140625, -0.57952880859375, -0.5337982177734375, -0.488067626953125, -0.4423370361328125, -0.3966064453125, -0.3508758544921875, -0.305145263671875, -0.2594146728515625, -0.21368408203125, -0.1679534912109375, -0.122222900390625, -0.0764923095703125, -0.03076171875, 0.0149688720703125, 0.060699462890625, 0.1064300537109375, 0.15216064453125, 0.1978912353515625, 0.243621826171875, 0.2893524169921875, 0.3350830078125, 0.3808135986328125, 0.426544189453125, 0.4722747802734375, 0.51800537109375, 0.5637359619140625, 0.609466552734375, 0.6551971435546875, 0.700927734375, 0.7466583251953125, 0.792388916015625, 0.8381195068359375, 0.88385009765625, 0.9295806884765625, 0.975311279296875, 1.0210418701171875, 1.0667724609375, 1.1125030517578125, 1.158233642578125, 1.2039642333984375, 1.24969482421875, 1.2954254150390625, 1.341156005859375, 1.3868865966796875, 1.4326171875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 9.0, 9.0, 11.0, 8.0, 19.0, 20.0, 10.0, 18.0, 19.0, 35.0, 23.0, 29.0, 33.0, 38.0, 55.0, 45.0, 35.0, 38.0, 56.0, 26.0, 32.0, 48.0, 41.0, 34.0, 45.0, 37.0, 27.0, 49.0, 25.0, 22.0, 9.0, 15.0, 11.0, 9.0, 11.0, 6.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.18359375, -2.11395263671875, -2.0443115234375, -1.97467041015625, -1.905029296875, -1.83538818359375, -1.7657470703125, -1.69610595703125, -1.62646484375, -1.55682373046875, -1.4871826171875, -1.41754150390625, -1.347900390625, -1.27825927734375, -1.2086181640625, -1.13897705078125, -1.0693359375, -0.99969482421875, -0.9300537109375, -0.86041259765625, -0.790771484375, -0.72113037109375, -0.6514892578125, -0.58184814453125, -0.51220703125, -0.44256591796875, -0.3729248046875, -0.30328369140625, -0.233642578125, -0.16400146484375, -0.0943603515625, -0.02471923828125, 0.044921875, 0.11456298828125, 0.1842041015625, 0.25384521484375, 0.323486328125, 0.39312744140625, 0.4627685546875, 0.53240966796875, 0.60205078125, 0.67169189453125, 0.7413330078125, 0.81097412109375, 0.880615234375, 0.95025634765625, 1.0198974609375, 1.08953857421875, 1.1591796875, 1.22882080078125, 1.2984619140625, 1.36810302734375, 1.437744140625, 1.50738525390625, 1.5770263671875, 1.64666748046875, 1.71630859375, 1.78594970703125, 1.8555908203125, 1.92523193359375, 1.994873046875, 2.06451416015625, 2.1341552734375, 2.20379638671875, 2.2734375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 16.0, 17.0, 14.0, 23.0, 40.0, 52.0, 77.0, 94.0, 140.0, 189.0, 292.0, 440.0, 626.0, 896.0, 1529.0, 2363.0, 3891.0, 6751.0, 13531.0, 32343.0, 112107.0, 569865.0, 213228.0, 49977.0, 18535.0, 8629.0, 4749.0, 2887.0, 1734.0, 1152.0, 794.0, 433.0, 366.0, 237.0, 164.0, 100.0, 75.0, 57.0, 38.0, 25.0, 15.0, 19.0, 14.0, 9.0, 2.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.189453125, -2.11572265625, -2.0419921875, -1.96826171875, -1.89453125, -1.82080078125, -1.7470703125, -1.67333984375, -1.599609375, -1.52587890625, -1.4521484375, -1.37841796875, -1.3046875, -1.23095703125, -1.1572265625, -1.08349609375, -1.009765625, -0.93603515625, -0.8623046875, -0.78857421875, -0.71484375, -0.64111328125, -0.5673828125, -0.49365234375, -0.419921875, -0.34619140625, -0.2724609375, -0.19873046875, -0.125, -0.05126953125, 0.0224609375, 0.09619140625, 0.169921875, 0.24365234375, 0.3173828125, 0.39111328125, 0.46484375, 0.53857421875, 0.6123046875, 0.68603515625, 0.759765625, 0.83349609375, 0.9072265625, 0.98095703125, 1.0546875, 1.12841796875, 1.2021484375, 1.27587890625, 1.349609375, 1.42333984375, 1.4970703125, 1.57080078125, 1.64453125, 1.71826171875, 1.7919921875, 1.86572265625, 1.939453125, 2.01318359375, 2.0869140625, 2.16064453125, 2.234375, 2.30810546875, 2.3818359375, 2.45556640625, 2.529296875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 6.0, 2.0, 10.0, 5.0, 14.0, 8.0, 13.0, 18.0, 17.0, 23.0, 18.0, 35.0, 31.0, 28.0, 36.0, 38.0, 42.0, 46.0, 41.0, 51.0, 36.0, 46.0, 47.0, 35.0, 23.0, 31.0, 49.0, 37.0, 26.0, 30.0, 23.0, 26.0, 26.0, 13.0, 10.0, 9.0, 13.0, 6.0, 3.0, 6.0, 5.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.42578125, -1.3816986083984375, -1.337615966796875, -1.2935333251953125, -1.24945068359375, -1.2053680419921875, -1.161285400390625, -1.1172027587890625, -1.0731201171875, -1.0290374755859375, -0.984954833984375, -0.9408721923828125, -0.89678955078125, -0.8527069091796875, -0.808624267578125, -0.7645416259765625, -0.720458984375, -0.6763763427734375, -0.632293701171875, -0.5882110595703125, -0.54412841796875, -0.5000457763671875, -0.455963134765625, -0.4118804931640625, -0.3677978515625, -0.3237152099609375, -0.279632568359375, -0.2355499267578125, -0.19146728515625, -0.1473846435546875, -0.103302001953125, -0.0592193603515625, -0.01513671875, 0.0289459228515625, 0.073028564453125, 0.1171112060546875, 0.16119384765625, 0.2052764892578125, 0.249359130859375, 0.2934417724609375, 0.3375244140625, 0.3816070556640625, 0.425689697265625, 0.4697723388671875, 0.51385498046875, 0.5579376220703125, 0.602020263671875, 0.6461029052734375, 0.690185546875, 0.7342681884765625, 0.778350830078125, 0.8224334716796875, 0.86651611328125, 0.9105987548828125, 0.954681396484375, 0.9987640380859375, 1.0428466796875, 1.0869293212890625, 1.131011962890625, 1.1750946044921875, 1.21917724609375, 1.2632598876953125, 1.307342529296875, 1.3514251708984375, 1.3955078125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 15.0, 8.0, 13.0, 13.0, 28.0, 36.0, 49.0, 63.0, 125.0, 178.0, 283.0, 453.0, 691.0, 1143.0, 2011.0, 3704.0, 7532.0, 17675.0, 59129.0, 650543.0, 239544.0, 38780.0, 13169.0, 5887.0, 3085.0, 1696.0, 975.0, 586.0, 402.0, 240.0, 162.0, 113.0, 63.0, 52.0, 34.0, 23.0, 14.0, 9.0, 8.0, 7.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.357177734375, -0.3452110290527344, -0.33324432373046875, -0.3212776184082031, -0.3093109130859375, -0.2973442077636719, -0.28537750244140625, -0.2734107971191406, -0.261444091796875, -0.24947738647460938, -0.23751068115234375, -0.22554397583007812, -0.2135772705078125, -0.20161056518554688, -0.18964385986328125, -0.17767715454101562, -0.16571044921875, -0.15374374389648438, -0.14177703857421875, -0.12981033325195312, -0.1178436279296875, -0.10587692260742188, -0.09391021728515625, -0.08194351196289062, -0.069976806640625, -0.058010101318359375, -0.04604339599609375, -0.034076690673828125, -0.0221099853515625, -0.010143280029296875, 0.00182342529296875, 0.013790130615234375, 0.0257568359375, 0.037723541259765625, 0.04969024658203125, 0.061656951904296875, 0.0736236572265625, 0.08559036254882812, 0.09755706787109375, 0.10952377319335938, 0.121490478515625, 0.13345718383789062, 0.14542388916015625, 0.15739059448242188, 0.1693572998046875, 0.18132400512695312, 0.19329071044921875, 0.20525741577148438, 0.21722412109375, 0.22919082641601562, 0.24115753173828125, 0.2531242370605469, 0.2650909423828125, 0.2770576477050781, 0.28902435302734375, 0.3009910583496094, 0.312957763671875, 0.3249244689941406, 0.33689117431640625, 0.3488578796386719, 0.3608245849609375, 0.3727912902832031, 0.38475799560546875, 0.3967247009277344, 0.40869140625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 7.0, 15.0, 20.0, 17.0, 19.0, 29.0, 51.0, 64.0, 96.0, 126.0, 133.0, 103.0, 87.0, 68.0, 46.0, 24.0, 19.0, 17.0, 7.0, 9.0, 7.0, 1.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.841876655817032e-05, -1.788325607776642e-05, -1.734774559736252e-05, -1.6812235116958618e-05, -1.6276724636554718e-05, -1.5741214156150818e-05, -1.5205703675746918e-05, -1.4670193195343018e-05, -1.4134682714939117e-05, -1.3599172234535217e-05, -1.3063661754131317e-05, -1.2528151273727417e-05, -1.1992640793323517e-05, -1.1457130312919617e-05, -1.0921619832515717e-05, -1.0386109352111816e-05, -9.850598871707916e-06, -9.315088391304016e-06, -8.779577910900116e-06, -8.244067430496216e-06, -7.708556950092316e-06, -7.1730464696884155e-06, -6.637535989284515e-06, -6.102025508880615e-06, -5.566515028476715e-06, -5.031004548072815e-06, -4.495494067668915e-06, -3.959983587265015e-06, -3.4244731068611145e-06, -2.8889626264572144e-06, -2.353452146053314e-06, -1.817941665649414e-06, -1.282431185245514e-06, -7.469207048416138e-07, -2.1141022443771362e-07, 3.241002559661865e-07, 8.596107363700867e-07, 1.3951212167739868e-06, 1.930631697177887e-06, 2.466142177581787e-06, 3.0016526579856873e-06, 3.5371631383895874e-06, 4.0726736187934875e-06, 4.608184099197388e-06, 5.143694579601288e-06, 5.679205060005188e-06, 6.214715540409088e-06, 6.750226020812988e-06, 7.2857365012168884e-06, 7.821246981620789e-06, 8.356757462024689e-06, 8.892267942428589e-06, 9.427778422832489e-06, 9.96328890323639e-06, 1.049879938364029e-05, 1.103430986404419e-05, 1.156982034444809e-05, 1.210533082485199e-05, 1.264084130525589e-05, 1.317635178565979e-05, 1.371186226606369e-05, 1.424737274646759e-05, 1.478288322687149e-05, 1.531839370727539e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 11.0, 8.0, 23.0, 14.0, 31.0, 44.0, 60.0, 86.0, 93.0, 161.0, 253.0, 363.0, 527.0, 808.0, 1249.0, 2069.0, 3402.0, 5675.0, 9833.0, 18386.0, 35798.0, 76304.0, 208982.0, 446073.0, 125569.0, 53294.0, 26232.0, 13834.0, 7541.0, 4410.0, 2619.0, 1657.0, 1108.0, 665.0, 454.0, 280.0, 198.0, 126.0, 103.0, 64.0, 49.0, 28.0, 25.0, 11.0, 10.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.332763671875, -0.3224525451660156, -0.31214141845703125, -0.3018302917480469, -0.2915191650390625, -0.2812080383300781, -0.27089691162109375, -0.2605857849121094, -0.250274658203125, -0.23996353149414062, -0.22965240478515625, -0.21934127807617188, -0.2090301513671875, -0.19871902465820312, -0.18840789794921875, -0.17809677124023438, -0.16778564453125, -0.15747451782226562, -0.14716339111328125, -0.13685226440429688, -0.1265411376953125, -0.11623001098632812, -0.10591888427734375, -0.09560775756835938, -0.085296630859375, -0.07498550415039062, -0.06467437744140625, -0.054363250732421875, -0.0440521240234375, -0.033740997314453125, -0.02342987060546875, -0.013118743896484375, -0.0028076171875, 0.007503509521484375, 0.01781463623046875, 0.028125762939453125, 0.0384368896484375, 0.048748016357421875, 0.05905914306640625, 0.06937026977539062, 0.079681396484375, 0.08999252319335938, 0.10030364990234375, 0.11061477661132812, 0.1209259033203125, 0.13123703002929688, 0.14154815673828125, 0.15185928344726562, 0.16217041015625, 0.17248153686523438, 0.18279266357421875, 0.19310379028320312, 0.2034149169921875, 0.21372604370117188, 0.22403717041015625, 0.23434829711914062, 0.244659423828125, 0.2549705505371094, 0.26528167724609375, 0.2755928039550781, 0.2859039306640625, 0.2962150573730469, 0.30652618408203125, 0.3168373107910156, 0.3271484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 4.0, 10.0, 7.0, 16.0, 13.0, 15.0, 27.0, 25.0, 27.0, 36.0, 31.0, 33.0, 45.0, 50.0, 62.0, 57.0, 87.0, 53.0, 66.0, 60.0, 41.0, 35.0, 34.0, 22.0, 29.0, 16.0, 26.0, 7.0, 11.0, 5.0, 11.0, 9.0, 6.0, 1.0, 3.0, 1.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1005859375, -0.09765434265136719, -0.09472274780273438, -0.09179115295410156, -0.08885955810546875, -0.08592796325683594, -0.08299636840820312, -0.08006477355957031, -0.0771331787109375, -0.07420158386230469, -0.07126998901367188, -0.06833839416503906, -0.06540679931640625, -0.06247520446777344, -0.059543609619140625, -0.05661201477050781, -0.053680419921875, -0.05074882507324219, -0.047817230224609375, -0.04488563537597656, -0.04195404052734375, -0.03902244567871094, -0.036090850830078125, -0.03315925598144531, -0.0302276611328125, -0.027296066284179688, -0.024364471435546875, -0.021432876586914062, -0.01850128173828125, -0.015569686889648438, -0.012638092041015625, -0.009706497192382812, -0.00677490234375, -0.0038433074951171875, -0.000911712646484375, 0.0020198822021484375, 0.00495147705078125, 0.007883071899414062, 0.010814666748046875, 0.013746261596679688, 0.0166778564453125, 0.019609451293945312, 0.022541046142578125, 0.025472640991210938, 0.02840423583984375, 0.03133583068847656, 0.034267425537109375, 0.03719902038574219, 0.040130615234375, 0.04306221008300781, 0.045993804931640625, 0.04892539978027344, 0.05185699462890625, 0.05478858947753906, 0.057720184326171875, 0.06065177917480469, 0.0635833740234375, 0.06651496887207031, 0.06944656372070312, 0.07237815856933594, 0.07530975341796875, 0.07824134826660156, 0.08117294311523438, 0.08410453796386719, 0.0870361328125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 7.0, 6.0, 13.0, 17.0, 17.0, 28.0, 45.0, 65.0, 102.0, 140.0, 130.0, 105.0, 78.0, 62.0, 42.0, 21.0, 25.0, 25.0, 17.0, 15.0, 15.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0], "bins": [-5.211032390594482, -5.093585014343262, -4.976137638092041, -4.858689785003662, -4.741242408752441, -4.623795032501221, -4.50634765625, -4.388899803161621, -4.2714524269104, -4.15400505065918, -4.036557674407959, -3.919110059738159, -3.8016624450683594, -3.6842150688171387, -3.566767692565918, -3.449320077896118, -3.3318727016448975, -3.2144253253936768, -3.096977710723877, -2.9795303344726562, -2.8620827198028564, -2.7446353435516357, -2.627187728881836, -2.5097403526306152, -2.3922929763793945, -2.274845600128174, -2.157397985458374, -2.0399506092071533, -1.9225029945373535, -1.8050556182861328, -1.6876081228256226, -1.5701606273651123, -1.4527132511138916, -1.3352657556533813, -1.217818260192871, -1.1003708839416504, -0.9829233288764954, -0.8654758334159851, -0.7480283975601196, -0.6305809020996094, -0.5131334066390991, -0.39568591117858887, -0.278238445520401, -0.16079097986221313, -0.04334348440170288, 0.07410401105880737, 0.19155144691467285, 0.3089989423751831, 0.42644643783569336, 0.5438939332962036, 0.6613414287567139, 0.7787888646125793, 0.8962363600730896, 1.013683795928955, 1.1311312913894653, 1.2485787868499756, 1.3660262823104858, 1.483473777770996, 1.6009212732315063, 1.7183687686920166, 1.8358161449432373, 1.953263759613037, 2.070711135864258, 2.1881585121154785, 2.3056061267852783]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 4.0, 6.0, 9.0, 7.0, 15.0, 11.0, 12.0, 11.0, 17.0, 9.0, 20.0, 25.0, 25.0, 24.0, 23.0, 34.0, 31.0, 33.0, 39.0, 40.0, 42.0, 37.0, 41.0, 41.0, 39.0, 37.0, 27.0, 36.0, 27.0, 34.0, 34.0, 33.0, 34.0, 26.0, 9.0, 25.0, 13.0, 13.0, 10.0, 10.0, 3.0, 5.0, 4.0, 10.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.0459110736846924, -1.9807226657867432, -1.915534257888794, -1.8503458499908447, -1.7851574420928955, -1.7199690341949463, -1.654780626296997, -1.5895922183990479, -1.5244038105010986, -1.4592154026031494, -1.3940269947052002, -1.328838586807251, -1.2636501789093018, -1.1984617710113525, -1.1332733631134033, -1.068084955215454, -1.0028965473175049, -0.9377081394195557, -0.8725197315216064, -0.8073313236236572, -0.742142915725708, -0.6769545078277588, -0.6117660999298096, -0.5465776920318604, -0.48138928413391113, -0.4162008762359619, -0.3510124683380127, -0.2858240604400635, -0.22063565254211426, -0.15544724464416504, -0.09025883674621582, -0.0250704288482666, 0.04011797904968262, 0.10530638694763184, 0.17049479484558105, 0.23568320274353027, 0.3008716106414795, 0.3660600185394287, 0.43124842643737793, 0.49643683433532715, 0.5616252422332764, 0.6268136501312256, 0.6920020580291748, 0.757190465927124, 0.8223788738250732, 0.8875672817230225, 0.9527556896209717, 1.017944097518921, 1.0831325054168701, 1.1483209133148193, 1.2135093212127686, 1.2786977291107178, 1.343886137008667, 1.4090745449066162, 1.4742629528045654, 1.5394513607025146, 1.6046397686004639, 1.669828176498413, 1.7350165843963623, 1.8002049922943115, 1.8653934001922607, 1.93058180809021, 1.9957702159881592, 2.0609586238861084, 2.1261470317840576]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 10.0, 12.0, 20.0, 27.0, 40.0, 69.0, 76.0, 102.0, 169.0, 201.0, 297.0, 431.0, 631.0, 849.0, 1312.0, 1902.0, 2793.0, 4344.0, 6826.0, 11239.0, 18217.0, 30994.0, 53417.0, 93411.0, 166659.0, 245916.0, 173113.0, 97276.0, 55129.0, 31682.0, 19011.0, 11522.0, 7252.0, 4440.0, 2952.0, 1983.0, 1335.0, 880.0, 576.0, 425.0, 288.0, 227.0, 136.0, 106.0, 77.0, 59.0, 29.0, 36.0, 19.0, 16.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0], "bins": [-3.349609375, -3.24664306640625, -3.1436767578125, -3.04071044921875, -2.937744140625, -2.83477783203125, -2.7318115234375, -2.62884521484375, -2.52587890625, -2.42291259765625, -2.3199462890625, -2.21697998046875, -2.114013671875, -2.01104736328125, -1.9080810546875, -1.80511474609375, -1.7021484375, -1.59918212890625, -1.4962158203125, -1.39324951171875, -1.290283203125, -1.18731689453125, -1.0843505859375, -0.98138427734375, -0.87841796875, -0.77545166015625, -0.6724853515625, -0.56951904296875, -0.466552734375, -0.36358642578125, -0.2606201171875, -0.15765380859375, -0.0546875, 0.04827880859375, 0.1512451171875, 0.25421142578125, 0.357177734375, 0.46014404296875, 0.5631103515625, 0.66607666015625, 0.76904296875, 0.87200927734375, 0.9749755859375, 1.07794189453125, 1.180908203125, 1.28387451171875, 1.3868408203125, 1.48980712890625, 1.5927734375, 1.69573974609375, 1.7987060546875, 1.90167236328125, 2.004638671875, 2.10760498046875, 2.2105712890625, 2.31353759765625, 2.41650390625, 2.51947021484375, 2.6224365234375, 2.72540283203125, 2.828369140625, 2.93133544921875, 3.0343017578125, 3.13726806640625, 3.240234375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 8.0, 8.0, 5.0, 4.0, 10.0, 8.0, 14.0, 13.0, 17.0, 18.0, 20.0, 28.0, 25.0, 31.0, 22.0, 31.0, 22.0, 46.0, 36.0, 47.0, 31.0, 53.0, 44.0, 43.0, 39.0, 27.0, 48.0, 35.0, 30.0, 29.0, 33.0, 25.0, 28.0, 22.0, 15.0, 23.0, 12.0, 12.0, 10.0, 4.0, 3.0, 2.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8173828125, -1.75872802734375, -1.7000732421875, -1.64141845703125, -1.582763671875, -1.52410888671875, -1.4654541015625, -1.40679931640625, -1.34814453125, -1.28948974609375, -1.2308349609375, -1.17218017578125, -1.113525390625, -1.05487060546875, -0.9962158203125, -0.93756103515625, -0.87890625, -0.82025146484375, -0.7615966796875, -0.70294189453125, -0.644287109375, -0.58563232421875, -0.5269775390625, -0.46832275390625, -0.40966796875, -0.35101318359375, -0.2923583984375, -0.23370361328125, -0.175048828125, -0.11639404296875, -0.0577392578125, 0.00091552734375, 0.0595703125, 0.11822509765625, 0.1768798828125, 0.23553466796875, 0.294189453125, 0.35284423828125, 0.4114990234375, 0.47015380859375, 0.52880859375, 0.58746337890625, 0.6461181640625, 0.70477294921875, 0.763427734375, 0.82208251953125, 0.8807373046875, 0.93939208984375, 0.998046875, 1.05670166015625, 1.1153564453125, 1.17401123046875, 1.232666015625, 1.29132080078125, 1.3499755859375, 1.40863037109375, 1.46728515625, 1.52593994140625, 1.5845947265625, 1.64324951171875, 1.701904296875, 1.76055908203125, 1.8192138671875, 1.87786865234375, 1.9365234375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 5.0, 19.0, 21.0, 15.0, 41.0, 62.0, 106.0, 123.0, 187.0, 315.0, 479.0, 837.0, 1293.0, 2149.0, 3639.0, 6101.0, 10884.0, 19521.0, 35842.0, 67491.0, 131018.0, 250309.0, 245397.0, 126616.0, 66563.0, 34913.0, 18827.0, 10593.0, 6025.0, 3600.0, 2055.0, 1282.0, 775.0, 509.0, 312.0, 219.0, 140.0, 80.0, 59.0, 41.0, 23.0, 10.0, 13.0, 16.0, 7.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.462890625, -3.347381591796875, -3.23187255859375, -3.116363525390625, -3.0008544921875, -2.885345458984375, -2.76983642578125, -2.654327392578125, -2.538818359375, -2.423309326171875, -2.30780029296875, -2.192291259765625, -2.0767822265625, -1.961273193359375, -1.84576416015625, -1.730255126953125, -1.61474609375, -1.499237060546875, -1.38372802734375, -1.268218994140625, -1.1527099609375, -1.037200927734375, -0.92169189453125, -0.806182861328125, -0.690673828125, -0.575164794921875, -0.45965576171875, -0.344146728515625, -0.2286376953125, -0.113128662109375, 0.00238037109375, 0.117889404296875, 0.2333984375, 0.348907470703125, 0.46441650390625, 0.579925537109375, 0.6954345703125, 0.810943603515625, 0.92645263671875, 1.041961669921875, 1.157470703125, 1.272979736328125, 1.38848876953125, 1.503997802734375, 1.6195068359375, 1.735015869140625, 1.85052490234375, 1.966033935546875, 2.08154296875, 2.197052001953125, 2.31256103515625, 2.428070068359375, 2.5435791015625, 2.659088134765625, 2.77459716796875, 2.890106201171875, 3.005615234375, 3.121124267578125, 3.23663330078125, 3.352142333984375, 3.4676513671875, 3.583160400390625, 3.69866943359375, 3.814178466796875, 3.9296875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 7.0, 6.0, 6.0, 6.0, 12.0, 10.0, 20.0, 23.0, 20.0, 20.0, 26.0, 28.0, 36.0, 40.0, 32.0, 32.0, 27.0, 54.0, 40.0, 37.0, 48.0, 56.0, 41.0, 55.0, 38.0, 35.0, 39.0, 32.0, 26.0, 16.0, 22.0, 25.0, 11.0, 19.0, 14.0, 13.0, 5.0, 9.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3173828125, -1.2744903564453125, -1.231597900390625, -1.1887054443359375, -1.14581298828125, -1.1029205322265625, -1.060028076171875, -1.0171356201171875, -0.9742431640625, -0.9313507080078125, -0.888458251953125, -0.8455657958984375, -0.80267333984375, -0.7597808837890625, -0.716888427734375, -0.6739959716796875, -0.631103515625, -0.5882110595703125, -0.545318603515625, -0.5024261474609375, -0.45953369140625, -0.4166412353515625, -0.373748779296875, -0.3308563232421875, -0.2879638671875, -0.2450714111328125, -0.202178955078125, -0.1592864990234375, -0.11639404296875, -0.0735015869140625, -0.030609130859375, 0.0122833251953125, 0.05517578125, 0.0980682373046875, 0.140960693359375, 0.1838531494140625, 0.22674560546875, 0.2696380615234375, 0.312530517578125, 0.3554229736328125, 0.3983154296875, 0.4412078857421875, 0.484100341796875, 0.5269927978515625, 0.56988525390625, 0.6127777099609375, 0.655670166015625, 0.6985626220703125, 0.741455078125, 0.7843475341796875, 0.827239990234375, 0.8701324462890625, 0.91302490234375, 0.9559173583984375, 0.998809814453125, 1.0417022705078125, 1.0845947265625, 1.1274871826171875, 1.170379638671875, 1.2132720947265625, 1.25616455078125, 1.2990570068359375, 1.341949462890625, 1.3848419189453125, 1.427734375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 5.0, 8.0, 11.0, 13.0, 16.0, 24.0, 28.0, 38.0, 67.0, 85.0, 98.0, 145.0, 202.0, 267.0, 381.0, 562.0, 864.0, 1256.0, 1948.0, 3221.0, 5216.0, 9133.0, 16882.0, 34630.0, 102122.0, 753548.0, 59375.0, 25771.0, 13202.0, 7370.0, 4310.0, 2609.0, 1645.0, 1065.0, 712.0, 478.0, 367.0, 234.0, 171.0, 144.0, 85.0, 72.0, 52.0, 42.0, 27.0, 22.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.66796875, -2.576934814453125, -2.48590087890625, -2.394866943359375, -2.3038330078125, -2.212799072265625, -2.12176513671875, -2.030731201171875, -1.939697265625, -1.848663330078125, -1.75762939453125, -1.666595458984375, -1.5755615234375, -1.484527587890625, -1.39349365234375, -1.302459716796875, -1.21142578125, -1.120391845703125, -1.02935791015625, -0.938323974609375, -0.8472900390625, -0.756256103515625, -0.66522216796875, -0.574188232421875, -0.483154296875, -0.392120361328125, -0.30108642578125, -0.210052490234375, -0.1190185546875, -0.027984619140625, 0.06304931640625, 0.154083251953125, 0.2451171875, 0.336151123046875, 0.42718505859375, 0.518218994140625, 0.6092529296875, 0.700286865234375, 0.79132080078125, 0.882354736328125, 0.973388671875, 1.064422607421875, 1.15545654296875, 1.246490478515625, 1.3375244140625, 1.428558349609375, 1.51959228515625, 1.610626220703125, 1.70166015625, 1.792694091796875, 1.88372802734375, 1.974761962890625, 2.0657958984375, 2.156829833984375, 2.24786376953125, 2.338897705078125, 2.429931640625, 2.520965576171875, 2.61199951171875, 2.703033447265625, 2.7940673828125, 2.885101318359375, 2.97613525390625, 3.067169189453125, 3.158203125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 5.0, 1.0, 17.0, 21.0, 16.0, 27.0, 46.0, 104.0, 396.0, 172.0, 64.0, 31.0, 19.0, 17.0, 12.0, 9.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001442432403564453, -0.00014078151434659958, -0.00013731978833675385, -0.0001338580623269081, -0.00013039633631706238, -0.00012693461030721664, -0.0001234728842973709, -0.00012001115828752518, -0.00011654943227767944, -0.00011308770626783371, -0.00010962598025798798, -0.00010616425424814224, -0.00010270252823829651, -9.924080222845078e-05, -9.577907621860504e-05, -9.231735020875931e-05, -8.885562419891357e-05, -8.539389818906784e-05, -8.193217217922211e-05, -7.847044616937637e-05, -7.500872015953064e-05, -7.15469941496849e-05, -6.808526813983917e-05, -6.462354212999344e-05, -6.11618161201477e-05, -5.770009011030197e-05, -5.423836410045624e-05, -5.0776638090610504e-05, -4.731491208076477e-05, -4.385318607091904e-05, -4.03914600610733e-05, -3.692973405122757e-05, -3.3468008041381836e-05, -3.0006282031536102e-05, -2.654455602169037e-05, -2.3082830011844635e-05, -1.96211040019989e-05, -1.6159377992153168e-05, -1.2697651982307434e-05, -9.2359259724617e-06, -5.774199962615967e-06, -2.312473952770233e-06, 1.1492520570755005e-06, 4.610978066921234e-06, 8.072704076766968e-06, 1.1534430086612701e-05, 1.4996156096458435e-05, 1.845788210630417e-05, 2.1919608116149902e-05, 2.5381334125995636e-05, 2.884306013584137e-05, 3.23047861456871e-05, 3.576651215553284e-05, 3.922823816537857e-05, 4.2689964175224304e-05, 4.615169018507004e-05, 4.961341619491577e-05, 5.3075142204761505e-05, 5.653686821460724e-05, 5.999859422445297e-05, 6.34603202342987e-05, 6.692204624414444e-05, 7.038377225399017e-05, 7.384549826383591e-05, 7.730722427368164e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 6.0, 9.0, 16.0, 27.0, 40.0, 47.0, 70.0, 101.0, 151.0, 248.0, 387.0, 600.0, 1026.0, 1636.0, 2809.0, 4876.0, 9091.0, 17509.0, 39031.0, 230657.0, 655061.0, 43511.0, 19070.0, 9701.0, 5235.0, 2997.0, 1765.0, 1085.0, 609.0, 396.0, 265.0, 168.0, 103.0, 76.0, 61.0, 40.0, 17.0, 13.0, 14.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.388671875, -3.286163330078125, -3.18365478515625, -3.081146240234375, -2.9786376953125, -2.876129150390625, -2.77362060546875, -2.671112060546875, -2.568603515625, -2.466094970703125, -2.36358642578125, -2.261077880859375, -2.1585693359375, -2.056060791015625, -1.95355224609375, -1.851043701171875, -1.74853515625, -1.646026611328125, -1.54351806640625, -1.441009521484375, -1.3385009765625, -1.235992431640625, -1.13348388671875, -1.030975341796875, -0.928466796875, -0.825958251953125, -0.72344970703125, -0.620941162109375, -0.5184326171875, -0.415924072265625, -0.31341552734375, -0.210906982421875, -0.1083984375, -0.005889892578125, 0.09661865234375, 0.199127197265625, 0.3016357421875, 0.404144287109375, 0.50665283203125, 0.609161376953125, 0.711669921875, 0.814178466796875, 0.91668701171875, 1.019195556640625, 1.1217041015625, 1.224212646484375, 1.32672119140625, 1.429229736328125, 1.53173828125, 1.634246826171875, 1.73675537109375, 1.839263916015625, 1.9417724609375, 2.044281005859375, 2.14678955078125, 2.249298095703125, 2.351806640625, 2.454315185546875, 2.55682373046875, 2.659332275390625, 2.7618408203125, 2.864349365234375, 2.96685791015625, 3.069366455078125, 3.171875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 6.0, 1.0, 14.0, 5.0, 9.0, 24.0, 18.0, 15.0, 27.0, 27.0, 42.0, 249.0, 328.0, 60.0, 25.0, 24.0, 16.0, 14.0, 14.0, 13.0, 14.0, 9.0, 4.0, 11.0, 4.0, 4.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80517578125, -0.7792434692382812, -0.7533111572265625, -0.7273788452148438, -0.701446533203125, -0.6755142211914062, -0.6495819091796875, -0.6236495971679688, -0.59771728515625, -0.5717849731445312, -0.5458526611328125, -0.5199203491210938, -0.493988037109375, -0.46805572509765625, -0.4421234130859375, -0.41619110107421875, -0.3902587890625, -0.36432647705078125, -0.3383941650390625, -0.31246185302734375, -0.286529541015625, -0.26059722900390625, -0.2346649169921875, -0.20873260498046875, -0.18280029296875, -0.15686798095703125, -0.1309356689453125, -0.10500335693359375, -0.079071044921875, -0.05313873291015625, -0.0272064208984375, -0.00127410888671875, 0.024658203125, 0.05059051513671875, 0.0765228271484375, 0.10245513916015625, 0.128387451171875, 0.15431976318359375, 0.1802520751953125, 0.20618438720703125, 0.23211669921875, 0.25804901123046875, 0.2839813232421875, 0.30991363525390625, 0.335845947265625, 0.36177825927734375, 0.3877105712890625, 0.41364288330078125, 0.4395751953125, 0.46550750732421875, 0.4914398193359375, 0.5173721313476562, 0.543304443359375, 0.5692367553710938, 0.5951690673828125, 0.6211013793945312, 0.64703369140625, 0.6729660034179688, 0.6988983154296875, 0.7248306274414062, 0.750762939453125, 0.7766952514648438, 0.8026275634765625, 0.8285598754882812, 0.8544921875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 17.0, 13.0, 21.0, 31.0, 48.0, 70.0, 103.0, 131.0, 127.0, 113.0, 75.0, 53.0, 46.0, 31.0, 27.0, 16.0, 15.0, 13.0, 5.0, 9.0, 4.0, 9.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.322625160217285, -4.217809200286865, -4.112993240356445, -4.008177280426025, -3.9033610820770264, -3.7985451221466064, -3.6937291622161865, -3.5889132022857666, -3.4840970039367676, -3.3792810440063477, -3.2744650840759277, -3.169649124145508, -3.064832925796509, -2.960016965866089, -2.855201005935669, -2.750385046005249, -2.645569086074829, -2.540753126144409, -2.4359371662139893, -2.3311209678649902, -2.2263050079345703, -2.1214890480041504, -2.0166730880737305, -1.9118571281433105, -1.807041049003601, -1.7022250890731812, -1.5974090099334717, -1.4925930500030518, -1.3877770900726318, -1.2829610109329224, -1.1781450510025024, -1.073328971862793, -0.9685132503509521, -0.8636972308158875, -0.7588812112808228, -0.6540652513504028, -0.5492492318153381, -0.44443321228027344, -0.3396172523498535, -0.23480123281478882, -0.12998521327972412, -0.025169208645820618, 0.07964679598808289, 0.1844627857208252, 0.2892788052558899, 0.3940948247909546, 0.4989107847213745, 0.6037268042564392, 0.7085428237915039, 0.8133588433265686, 0.9181748628616333, 1.0229908227920532, 1.1278069019317627, 1.2326228618621826, 1.3374388217926025, 1.4422547817230225, 1.547070860862732, 1.6518868207931519, 1.7567028999328613, 1.8615188598632812, 1.9663348197937012, 2.071150779724121, 2.175966739654541, 2.28078293800354, 2.38559889793396]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 3.0, 3.0, 10.0, 11.0, 12.0, 12.0, 12.0, 23.0, 23.0, 24.0, 20.0, 29.0, 17.0, 27.0, 28.0, 25.0, 39.0, 37.0, 43.0, 39.0, 42.0, 33.0, 38.0, 42.0, 37.0, 40.0, 32.0, 35.0, 29.0, 28.0, 25.0, 29.0, 18.0, 23.0, 23.0, 9.0, 9.0, 9.0, 7.0, 9.0, 5.0, 3.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8004070520401, -1.7410697937011719, -1.6817326545715332, -1.622395396232605, -1.5630581378936768, -1.5037208795547485, -1.4443836212158203, -1.3850464820861816, -1.3257092237472534, -1.2663719654083252, -1.2070348262786865, -1.1476975679397583, -1.08836030960083, -1.0290230512619019, -0.9696858525276184, -0.910348653793335, -0.8510113954544067, -0.7916741371154785, -0.7323369383811951, -0.6729997396469116, -0.6136624813079834, -0.5543252229690552, -0.49498802423477173, -0.4356507956981659, -0.37631356716156006, -0.3169763386249542, -0.2576391100883484, -0.19830188155174255, -0.13896465301513672, -0.07962742447853088, -0.02029019594192505, 0.039047032594680786, 0.09838414192199707, 0.1577213704586029, 0.21705859899520874, 0.2763958275318146, 0.3357330560684204, 0.39507028460502625, 0.4544075131416321, 0.5137447118759155, 0.5730819702148438, 0.632419228553772, 0.6917564272880554, 0.7510936260223389, 0.8104308843612671, 0.8697681427001953, 0.9291053414344788, 0.9884425401687622, 1.0477797985076904, 1.1071170568466187, 1.1664543151855469, 1.2257914543151855, 1.2851287126541138, 1.344465970993042, 1.4038031101226807, 1.4631403684616089, 1.522477626800537, 1.5818148851394653, 1.6411521434783936, 1.7004892826080322, 1.7598265409469604, 1.8191637992858887, 1.8785009384155273, 1.9378381967544556, 1.9971754550933838]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 6.0, 11.0, 12.0, 20.0, 18.0, 25.0, 35.0, 48.0, 69.0, 80.0, 126.0, 171.0, 243.0, 360.0, 411.0, 600.0, 872.0, 1324.0, 1911.0, 2730.0, 4091.0, 6152.0, 9480.0, 14890.0, 24642.0, 41716.0, 77018.0, 161018.0, 456014.0, 1669976.0, 1142767.0, 295667.0, 122901.0, 62924.0, 35547.0, 21252.0, 13288.0, 8324.0, 5476.0, 3680.0, 2560.0, 1727.0, 1230.0, 821.0, 596.0, 406.0, 322.0, 209.0, 168.0, 107.0, 77.0, 53.0, 47.0, 26.0, 19.0, 12.0, 12.0, 4.0, 2.0, 3.0], "bins": [-2.833984375, -2.750213623046875, -2.66644287109375, -2.582672119140625, -2.4989013671875, -2.415130615234375, -2.33135986328125, -2.247589111328125, -2.163818359375, -2.080047607421875, -1.99627685546875, -1.912506103515625, -1.8287353515625, -1.744964599609375, -1.66119384765625, -1.577423095703125, -1.49365234375, -1.409881591796875, -1.32611083984375, -1.242340087890625, -1.1585693359375, -1.074798583984375, -0.99102783203125, -0.907257080078125, -0.823486328125, -0.739715576171875, -0.65594482421875, -0.572174072265625, -0.4884033203125, -0.404632568359375, -0.32086181640625, -0.237091064453125, -0.1533203125, -0.069549560546875, 0.01422119140625, 0.097991943359375, 0.1817626953125, 0.265533447265625, 0.34930419921875, 0.433074951171875, 0.516845703125, 0.600616455078125, 0.68438720703125, 0.768157958984375, 0.8519287109375, 0.935699462890625, 1.01947021484375, 1.103240966796875, 1.18701171875, 1.270782470703125, 1.35455322265625, 1.438323974609375, 1.5220947265625, 1.605865478515625, 1.68963623046875, 1.773406982421875, 1.857177734375, 1.940948486328125, 2.02471923828125, 2.108489990234375, 2.1922607421875, 2.276031494140625, 2.35980224609375, 2.443572998046875, 2.52734375]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 8.0, 4.0, 2.0, 9.0, 4.0, 5.0, 13.0, 7.0, 16.0, 15.0, 14.0, 19.0, 14.0, 17.0, 21.0, 39.0, 27.0, 30.0, 33.0, 37.0, 35.0, 39.0, 37.0, 46.0, 40.0, 27.0, 35.0, 50.0, 46.0, 30.0, 35.0, 36.0, 27.0, 26.0, 22.0, 30.0, 22.0, 15.0, 11.0, 6.0, 8.0, 13.0, 6.0, 7.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.240234375, -1.2017822265625, -1.163330078125, -1.1248779296875, -1.08642578125, -1.0479736328125, -1.009521484375, -0.9710693359375, -0.9326171875, -0.8941650390625, -0.855712890625, -0.8172607421875, -0.77880859375, -0.7403564453125, -0.701904296875, -0.6634521484375, -0.625, -0.5865478515625, -0.548095703125, -0.5096435546875, -0.47119140625, -0.4327392578125, -0.394287109375, -0.3558349609375, -0.3173828125, -0.2789306640625, -0.240478515625, -0.2020263671875, -0.16357421875, -0.1251220703125, -0.086669921875, -0.0482177734375, -0.009765625, 0.0286865234375, 0.067138671875, 0.1055908203125, 0.14404296875, 0.1824951171875, 0.220947265625, 0.2593994140625, 0.2978515625, 0.3363037109375, 0.374755859375, 0.4132080078125, 0.45166015625, 0.4901123046875, 0.528564453125, 0.5670166015625, 0.60546875, 0.6439208984375, 0.682373046875, 0.7208251953125, 0.75927734375, 0.7977294921875, 0.836181640625, 0.8746337890625, 0.9130859375, 0.9515380859375, 0.989990234375, 1.0284423828125, 1.06689453125, 1.1053466796875, 1.143798828125, 1.1822509765625, 1.220703125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 13.0, 15.0, 18.0, 38.0, 52.0, 87.0, 94.0, 166.0, 237.0, 323.0, 482.0, 781.0, 1225.0, 1767.0, 2834.0, 4550.0, 7675.0, 13186.0, 23323.0, 43947.0, 87688.0, 190559.0, 490379.0, 1596396.0, 1085570.0, 346911.0, 144130.0, 68852.0, 35280.0, 19157.0, 10989.0, 6529.0, 4044.0, 2466.0, 1520.0, 964.0, 658.0, 442.0, 326.0, 200.0, 128.0, 82.0, 58.0, 45.0, 29.0, 17.0, 23.0, 8.0, 3.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.546875, -2.46929931640625, -2.3917236328125, -2.31414794921875, -2.236572265625, -2.15899658203125, -2.0814208984375, -2.00384521484375, -1.92626953125, -1.84869384765625, -1.7711181640625, -1.69354248046875, -1.615966796875, -1.53839111328125, -1.4608154296875, -1.38323974609375, -1.3056640625, -1.22808837890625, -1.1505126953125, -1.07293701171875, -0.995361328125, -0.91778564453125, -0.8402099609375, -0.76263427734375, -0.68505859375, -0.60748291015625, -0.5299072265625, -0.45233154296875, -0.374755859375, -0.29718017578125, -0.2196044921875, -0.14202880859375, -0.064453125, 0.01312255859375, 0.0906982421875, 0.16827392578125, 0.245849609375, 0.32342529296875, 0.4010009765625, 0.47857666015625, 0.55615234375, 0.63372802734375, 0.7113037109375, 0.78887939453125, 0.866455078125, 0.94403076171875, 1.0216064453125, 1.09918212890625, 1.1767578125, 1.25433349609375, 1.3319091796875, 1.40948486328125, 1.487060546875, 1.56463623046875, 1.6422119140625, 1.71978759765625, 1.79736328125, 1.87493896484375, 1.9525146484375, 2.03009033203125, 2.107666015625, 2.18524169921875, 2.2628173828125, 2.34039306640625, 2.41796875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 4.0, 8.0, 8.0, 10.0, 8.0, 22.0, 29.0, 38.0, 35.0, 42.0, 56.0, 67.0, 84.0, 117.0, 117.0, 151.0, 199.0, 215.0, 239.0, 274.0, 295.0, 300.0, 270.0, 235.0, 205.0, 209.0, 131.0, 131.0, 122.0, 91.0, 58.0, 46.0, 53.0, 43.0, 27.0, 33.0, 21.0, 10.0, 13.0, 13.0, 13.0, 6.0, 3.0, 8.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.64892578125, -0.6274948120117188, -0.6060638427734375, -0.5846328735351562, -0.563201904296875, -0.5417709350585938, -0.5203399658203125, -0.49890899658203125, -0.47747802734375, -0.45604705810546875, -0.4346160888671875, -0.41318511962890625, -0.391754150390625, -0.37032318115234375, -0.3488922119140625, -0.32746124267578125, -0.3060302734375, -0.28459930419921875, -0.2631683349609375, -0.24173736572265625, -0.220306396484375, -0.19887542724609375, -0.1774444580078125, -0.15601348876953125, -0.13458251953125, -0.11315155029296875, -0.0917205810546875, -0.07028961181640625, -0.048858642578125, -0.02742767333984375, -0.0059967041015625, 0.01543426513671875, 0.036865234375, 0.05829620361328125, 0.0797271728515625, 0.10115814208984375, 0.122589111328125, 0.14402008056640625, 0.1654510498046875, 0.18688201904296875, 0.20831298828125, 0.22974395751953125, 0.2511749267578125, 0.27260589599609375, 0.294036865234375, 0.31546783447265625, 0.3368988037109375, 0.35832977294921875, 0.3797607421875, 0.40119171142578125, 0.4226226806640625, 0.44405364990234375, 0.465484619140625, 0.48691558837890625, 0.5083465576171875, 0.5297775268554688, 0.55120849609375, 0.5726394653320312, 0.5940704345703125, 0.6155014038085938, 0.636932373046875, 0.6583633422851562, 0.6797943115234375, 0.7012252807617188, 0.72265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 11.0, 8.0, 19.0, 16.0, 26.0, 33.0, 52.0, 66.0, 108.0, 122.0, 129.0, 95.0, 75.0, 62.0, 41.0, 30.0, 30.0, 16.0, 14.0, 15.0, 12.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-3.228182554244995, -3.153517007827759, -3.0788512229919434, -3.004185676574707, -2.9295201301574707, -2.8548545837402344, -2.780188798904419, -2.7055232524871826, -2.630857467651367, -2.556191921234131, -2.4815261363983154, -2.406860589981079, -2.3321950435638428, -2.2575292587280273, -2.182863712310791, -2.1081981658935547, -2.0335326194763184, -1.9588669538497925, -1.8842014074325562, -1.8095357418060303, -1.734870195388794, -1.660204529762268, -1.5855388641357422, -1.5108733177185059, -1.43620765209198, -1.361541986465454, -1.2868764400482178, -1.212210774421692, -1.137545108795166, -1.0628795623779297, -0.9882138967514038, -0.9135482907295227, -0.8388824462890625, -0.7642168402671814, -0.6895512342453003, -0.6148855686187744, -0.5402199625968933, -0.4655543565750122, -0.3908887207508087, -0.3162230849266052, -0.24155747890472412, -0.16689185798168182, -0.09222623705863953, -0.01756061613559723, 0.05710500478744507, 0.13177061080932617, 0.20643624663352966, 0.28110188245773315, 0.35576748847961426, 0.43043309450149536, 0.5050987005233765, 0.5797643661499023, 0.6544299721717834, 0.7290955781936646, 0.8037612438201904, 0.8784268498420715, 0.9530924558639526, 1.0277581214904785, 1.1024236679077148, 1.1770893335342407, 1.2517549991607666, 1.326420545578003, 1.4010862112045288, 1.4757518768310547, 1.550417423248291]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 2.0, 5.0, 11.0, 6.0, 8.0, 9.0, 17.0, 18.0, 17.0, 19.0, 22.0, 36.0, 24.0, 29.0, 32.0, 25.0, 32.0, 33.0, 38.0, 44.0, 41.0, 52.0, 53.0, 40.0, 35.0, 33.0, 36.0, 35.0, 38.0, 35.0, 22.0, 24.0, 20.0, 23.0, 12.0, 14.0, 13.0, 11.0, 8.0, 8.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0], "bins": [-1.6920973062515259, -1.643949270248413, -1.5958012342453003, -1.5476531982421875, -1.4995052814483643, -1.4513572454452515, -1.4032092094421387, -1.3550611734390259, -1.306913137435913, -1.2587651014328003, -1.2106170654296875, -1.1624691486358643, -1.1143211126327515, -1.0661730766296387, -1.0180250406265259, -0.9698770046234131, -0.9217290282249451, -0.8735809922218323, -0.8254330158233643, -0.7772849798202515, -0.7291369438171387, -0.6809889078140259, -0.6328409314155579, -0.5846928954124451, -0.536544919013977, -0.48839691281318665, -0.44024887681007385, -0.39210087060928345, -0.34395283460617065, -0.29580482840538025, -0.24765682220458984, -0.19950878620147705, -0.15136075019836426, -0.10321272909641266, -0.055064715445041656, -0.006916701793670654, 0.041231319308280945, 0.08937934041023254, 0.13752734661102295, 0.18567538261413574, 0.23382338881492615, 0.28197139501571655, 0.33011943101882935, 0.37826743721961975, 0.42641544342041016, 0.47456347942352295, 0.5227115154266357, 0.5708595514297485, 0.6190075278282166, 0.6671555638313293, 0.7153035402297974, 0.7634515762329102, 0.811599612236023, 0.8597476482391357, 0.9078956246376038, 0.9560436606407166, 1.0041916370391846, 1.0523396730422974, 1.1004877090454102, 1.1486356258392334, 1.1967836618423462, 1.244931697845459, 1.2930797338485718, 1.3412277698516846, 1.3893758058547974]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 9.0, 12.0, 22.0, 29.0, 37.0, 42.0, 64.0, 78.0, 138.0, 191.0, 278.0, 406.0, 556.0, 880.0, 1287.0, 1930.0, 2802.0, 4554.0, 6948.0, 11206.0, 18632.0, 32188.0, 58603.0, 113200.0, 224103.0, 264896.0, 138536.0, 70963.0, 38092.0, 21944.0, 12914.0, 7932.0, 5103.0, 3360.0, 2109.0, 1431.0, 980.0, 657.0, 430.0, 309.0, 195.0, 151.0, 104.0, 76.0, 60.0, 37.0, 32.0, 13.0, 17.0, 6.0, 4.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-0.7431640625, -0.7200469970703125, -0.696929931640625, -0.6738128662109375, -0.65069580078125, -0.6275787353515625, -0.604461669921875, -0.5813446044921875, -0.5582275390625, -0.5351104736328125, -0.511993408203125, -0.4888763427734375, -0.46575927734375, -0.4426422119140625, -0.419525146484375, -0.3964080810546875, -0.373291015625, -0.3501739501953125, -0.327056884765625, -0.3039398193359375, -0.28082275390625, -0.2577056884765625, -0.234588623046875, -0.2114715576171875, -0.1883544921875, -0.1652374267578125, -0.142120361328125, -0.1190032958984375, -0.09588623046875, -0.0727691650390625, -0.049652099609375, -0.0265350341796875, -0.00341796875, 0.0196990966796875, 0.042816162109375, 0.0659332275390625, 0.08905029296875, 0.1121673583984375, 0.135284423828125, 0.1584014892578125, 0.1815185546875, 0.2046356201171875, 0.227752685546875, 0.2508697509765625, 0.27398681640625, 0.2971038818359375, 0.320220947265625, 0.3433380126953125, 0.366455078125, 0.3895721435546875, 0.412689208984375, 0.4358062744140625, 0.45892333984375, 0.4820404052734375, 0.505157470703125, 0.5282745361328125, 0.5513916015625, 0.5745086669921875, 0.597625732421875, 0.6207427978515625, 0.64385986328125, 0.6669769287109375, 0.690093994140625, 0.7132110595703125, 0.736328125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 8.0, 3.0, 7.0, 9.0, 8.0, 11.0, 16.0, 14.0, 23.0, 19.0, 23.0, 26.0, 38.0, 20.0, 39.0, 36.0, 34.0, 39.0, 36.0, 48.0, 54.0, 48.0, 45.0, 50.0, 29.0, 39.0, 43.0, 41.0, 24.0, 28.0, 26.0, 14.0, 18.0, 23.0, 13.0, 14.0, 4.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.708984375, -1.6580810546875, -1.607177734375, -1.5562744140625, -1.50537109375, -1.4544677734375, -1.403564453125, -1.3526611328125, -1.3017578125, -1.2508544921875, -1.199951171875, -1.1490478515625, -1.09814453125, -1.0472412109375, -0.996337890625, -0.9454345703125, -0.89453125, -0.8436279296875, -0.792724609375, -0.7418212890625, -0.69091796875, -0.6400146484375, -0.589111328125, -0.5382080078125, -0.4873046875, -0.4364013671875, -0.385498046875, -0.3345947265625, -0.28369140625, -0.2327880859375, -0.181884765625, -0.1309814453125, -0.080078125, -0.0291748046875, 0.021728515625, 0.0726318359375, 0.12353515625, 0.1744384765625, 0.225341796875, 0.2762451171875, 0.3271484375, 0.3780517578125, 0.428955078125, 0.4798583984375, 0.53076171875, 0.5816650390625, 0.632568359375, 0.6834716796875, 0.734375, 0.7852783203125, 0.836181640625, 0.8870849609375, 0.93798828125, 0.9888916015625, 1.039794921875, 1.0906982421875, 1.1416015625, 1.1925048828125, 1.243408203125, 1.2943115234375, 1.34521484375, 1.3961181640625, 1.447021484375, 1.4979248046875, 1.548828125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 3.0, 4.0, 2.0, 0.0, 7.0, 3.0, 8.0, 13.0, 17.0, 17.0, 30.0, 47.0, 60.0, 79.0, 112.0, 181.0, 223.0, 359.0, 489.0, 653.0, 1012.0, 1484.0, 2198.0, 3301.0, 5434.0, 9723.0, 18796.0, 44787.0, 134636.0, 490616.0, 215684.0, 63122.0, 25048.0, 11832.0, 6636.0, 3908.0, 2572.0, 1713.0, 1113.0, 814.0, 557.0, 359.0, 246.0, 190.0, 129.0, 95.0, 57.0, 55.0, 40.0, 35.0, 28.0, 13.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.185546875, -1.149261474609375, -1.11297607421875, -1.076690673828125, -1.0404052734375, -1.004119873046875, -0.96783447265625, -0.931549072265625, -0.895263671875, -0.858978271484375, -0.82269287109375, -0.786407470703125, -0.7501220703125, -0.713836669921875, -0.67755126953125, -0.641265869140625, -0.60498046875, -0.568695068359375, -0.53240966796875, -0.496124267578125, -0.4598388671875, -0.423553466796875, -0.38726806640625, -0.350982666015625, -0.314697265625, -0.278411865234375, -0.24212646484375, -0.205841064453125, -0.1695556640625, -0.133270263671875, -0.09698486328125, -0.060699462890625, -0.0244140625, 0.011871337890625, 0.04815673828125, 0.084442138671875, 0.1207275390625, 0.157012939453125, 0.19329833984375, 0.229583740234375, 0.265869140625, 0.302154541015625, 0.33843994140625, 0.374725341796875, 0.4110107421875, 0.447296142578125, 0.48358154296875, 0.519866943359375, 0.55615234375, 0.592437744140625, 0.62872314453125, 0.665008544921875, 0.7012939453125, 0.737579345703125, 0.77386474609375, 0.810150146484375, 0.846435546875, 0.882720947265625, 0.91900634765625, 0.955291748046875, 0.9915771484375, 1.027862548828125, 1.06414794921875, 1.100433349609375, 1.13671875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 6.0, 3.0, 5.0, 6.0, 7.0, 17.0, 11.0, 17.0, 16.0, 19.0, 24.0, 36.0, 26.0, 23.0, 29.0, 31.0, 39.0, 41.0, 51.0, 41.0, 45.0, 44.0, 43.0, 42.0, 44.0, 37.0, 39.0, 34.0, 30.0, 28.0, 20.0, 25.0, 20.0, 22.0, 11.0, 16.0, 8.0, 12.0, 13.0, 6.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.0830078125, -1.0519638061523438, -1.0209197998046875, -0.9898757934570312, -0.958831787109375, -0.9277877807617188, -0.8967437744140625, -0.8656997680664062, -0.83465576171875, -0.8036117553710938, -0.7725677490234375, -0.7415237426757812, -0.710479736328125, -0.6794357299804688, -0.6483917236328125, -0.6173477172851562, -0.5863037109375, -0.5552597045898438, -0.5242156982421875, -0.49317169189453125, -0.462127685546875, -0.43108367919921875, -0.4000396728515625, -0.36899566650390625, -0.33795166015625, -0.30690765380859375, -0.2758636474609375, -0.24481964111328125, -0.213775634765625, -0.18273162841796875, -0.1516876220703125, -0.12064361572265625, -0.089599609375, -0.05855560302734375, -0.0275115966796875, 0.00353240966796875, 0.034576416015625, 0.06562042236328125, 0.0966644287109375, 0.12770843505859375, 0.15875244140625, 0.18979644775390625, 0.2208404541015625, 0.25188446044921875, 0.282928466796875, 0.31397247314453125, 0.3450164794921875, 0.37606048583984375, 0.4071044921875, 0.43814849853515625, 0.4691925048828125, 0.5002365112304688, 0.531280517578125, 0.5623245239257812, 0.5933685302734375, 0.6244125366210938, 0.65545654296875, 0.6865005493164062, 0.7175445556640625, 0.7485885620117188, 0.779632568359375, 0.8106765747070312, 0.8417205810546875, 0.8727645874023438, 0.90380859375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 5.0, 4.0, 11.0, 11.0, 24.0, 40.0, 59.0, 111.0, 241.0, 348.0, 635.0, 1225.0, 2494.0, 5868.0, 18400.0, 101979.0, 815632.0, 76110.0, 15356.0, 5213.0, 2276.0, 1127.0, 572.0, 333.0, 174.0, 107.0, 65.0, 47.0, 16.0, 18.0, 9.0, 7.0, 3.0, 4.0, 1.0, 7.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.283203125, -0.2749786376953125, -0.266754150390625, -0.2585296630859375, -0.25030517578125, -0.2420806884765625, -0.233856201171875, -0.2256317138671875, -0.2174072265625, -0.2091827392578125, -0.200958251953125, -0.1927337646484375, -0.18450927734375, -0.1762847900390625, -0.168060302734375, -0.1598358154296875, -0.151611328125, -0.1433868408203125, -0.135162353515625, -0.1269378662109375, -0.11871337890625, -0.1104888916015625, -0.102264404296875, -0.0940399169921875, -0.0858154296875, -0.0775909423828125, -0.069366455078125, -0.0611419677734375, -0.05291748046875, -0.0446929931640625, -0.036468505859375, -0.0282440185546875, -0.02001953125, -0.0117950439453125, -0.003570556640625, 0.0046539306640625, 0.01287841796875, 0.0211029052734375, 0.029327392578125, 0.0375518798828125, 0.0457763671875, 0.0540008544921875, 0.062225341796875, 0.0704498291015625, 0.07867431640625, 0.0868988037109375, 0.095123291015625, 0.1033477783203125, 0.111572265625, 0.1197967529296875, 0.128021240234375, 0.1362457275390625, 0.14447021484375, 0.1526947021484375, 0.160919189453125, 0.1691436767578125, 0.1773681640625, 0.1855926513671875, 0.193817138671875, 0.2020416259765625, 0.21026611328125, 0.2184906005859375, 0.226715087890625, 0.2349395751953125, 0.2431640625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 14.0, 10.0, 14.0, 19.0, 35.0, 34.0, 62.0, 69.0, 99.0, 132.0, 122.0, 88.0, 77.0, 62.0, 38.0, 17.0, 19.0, 17.0, 11.0, 9.0, 11.0, 5.0, 2.0, 0.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.702278137207031e-06, -8.409842848777771e-06, -8.11740756034851e-06, -7.82497227191925e-06, -7.53253698348999e-06, -7.24010169506073e-06, -6.94766640663147e-06, -6.6552311182022095e-06, -6.362795829772949e-06, -6.070360541343689e-06, -5.777925252914429e-06, -5.4854899644851685e-06, -5.193054676055908e-06, -4.900619387626648e-06, -4.608184099197388e-06, -4.3157488107681274e-06, -4.023313522338867e-06, -3.730878233909607e-06, -3.4384429454803467e-06, -3.1460076570510864e-06, -2.853572368621826e-06, -2.561137080192566e-06, -2.2687017917633057e-06, -1.9762665033340454e-06, -1.6838312149047852e-06, -1.391395926475525e-06, -1.0989606380462646e-06, -8.065253496170044e-07, -5.140900611877441e-07, -2.2165477275848389e-07, 7.078051567077637e-08, 3.632158041000366e-07, 6.556510925292969e-07, 9.480863809585571e-07, 1.2405216693878174e-06, 1.5329569578170776e-06, 1.8253922462463379e-06, 2.117827534675598e-06, 2.4102628231048584e-06, 2.7026981115341187e-06, 2.995133399963379e-06, 3.287568688392639e-06, 3.5800039768218994e-06, 3.87243926525116e-06, 4.16487455368042e-06, 4.45730984210968e-06, 4.7497451305389404e-06, 5.042180418968201e-06, 5.334615707397461e-06, 5.627050995826721e-06, 5.9194862842559814e-06, 6.211921572685242e-06, 6.504356861114502e-06, 6.796792149543762e-06, 7.0892274379730225e-06, 7.381662726402283e-06, 7.674098014831543e-06, 7.966533303260803e-06, 8.258968591690063e-06, 8.551403880119324e-06, 8.843839168548584e-06, 9.136274456977844e-06, 9.428709745407104e-06, 9.721145033836365e-06, 1.0013580322265625e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 17.0, 14.0, 14.0, 40.0, 61.0, 44.0, 80.0, 113.0, 192.0, 249.0, 395.0, 579.0, 884.0, 1393.0, 2344.0, 4145.0, 6915.0, 13354.0, 27278.0, 63336.0, 180914.0, 486524.0, 151807.0, 55013.0, 24494.0, 12076.0, 6624.0, 3593.0, 2207.0, 1289.0, 825.0, 556.0, 371.0, 252.0, 152.0, 123.0, 85.0, 51.0, 41.0, 33.0, 15.0, 14.0, 14.0, 10.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.1158447265625, -0.111907958984375, -0.10797119140625, -0.104034423828125, -0.10009765625, -0.096160888671875, -0.09222412109375, -0.088287353515625, -0.0843505859375, -0.080413818359375, -0.07647705078125, -0.072540283203125, -0.068603515625, -0.064666748046875, -0.06072998046875, -0.056793212890625, -0.0528564453125, -0.048919677734375, -0.04498291015625, -0.041046142578125, -0.037109375, -0.033172607421875, -0.02923583984375, -0.025299072265625, -0.0213623046875, -0.017425537109375, -0.01348876953125, -0.009552001953125, -0.005615234375, -0.001678466796875, 0.00225830078125, 0.006195068359375, 0.0101318359375, 0.014068603515625, 0.01800537109375, 0.021942138671875, 0.02587890625, 0.029815673828125, 0.03375244140625, 0.037689208984375, 0.0416259765625, 0.045562744140625, 0.04949951171875, 0.053436279296875, 0.057373046875, 0.061309814453125, 0.06524658203125, 0.069183349609375, 0.0731201171875, 0.077056884765625, 0.08099365234375, 0.084930419921875, 0.0888671875, 0.092803955078125, 0.09674072265625, 0.100677490234375, 0.1046142578125, 0.108551025390625, 0.11248779296875, 0.116424560546875, 0.120361328125, 0.124298095703125, 0.12823486328125, 0.132171630859375, 0.1361083984375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 1.0, 4.0, 6.0, 8.0, 10.0, 16.0, 16.0, 22.0, 32.0, 30.0, 59.0, 65.0, 99.0, 141.0, 149.0, 98.0, 56.0, 46.0, 29.0, 19.0, 19.0, 19.0, 10.0, 9.0, 7.0, 5.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.06746768951416016, -0.06547737121582031, -0.06348705291748047, -0.061496734619140625, -0.05950641632080078, -0.05751609802246094, -0.055525779724121094, -0.05353546142578125, -0.051545143127441406, -0.04955482482910156, -0.04756450653076172, -0.045574188232421875, -0.04358386993408203, -0.04159355163574219, -0.039603233337402344, -0.0376129150390625, -0.035622596740722656, -0.03363227844238281, -0.03164196014404297, -0.029651641845703125, -0.02766132354736328, -0.025671005249023438, -0.023680686950683594, -0.02169036865234375, -0.019700050354003906, -0.017709732055664062, -0.01571941375732422, -0.013729095458984375, -0.011738777160644531, -0.009748458862304688, -0.007758140563964844, -0.005767822265625, -0.0037775039672851562, -0.0017871856689453125, 0.00020313262939453125, 0.002193450927734375, 0.004183769226074219, 0.0061740875244140625, 0.008164405822753906, 0.01015472412109375, 0.012145042419433594, 0.014135360717773438, 0.01612567901611328, 0.018115997314453125, 0.02010631561279297, 0.022096633911132812, 0.024086952209472656, 0.0260772705078125, 0.028067588806152344, 0.030057907104492188, 0.03204822540283203, 0.034038543701171875, 0.03602886199951172, 0.03801918029785156, 0.040009498596191406, 0.04199981689453125, 0.043990135192871094, 0.04598045349121094, 0.04797077178955078, 0.049961090087890625, 0.05195140838623047, 0.05394172668457031, 0.055932044982910156, 0.05792236328125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 11.0, 16.0, 18.0, 24.0, 38.0, 60.0, 71.0, 100.0, 126.0, 130.0, 105.0, 64.0, 64.0, 36.0, 24.0, 27.0, 22.0, 9.0, 19.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.2400801181793213, -3.164761781692505, -3.0894434452056885, -3.014125108718872, -2.9388067722320557, -2.86348819732666, -2.7881698608398438, -2.7128515243530273, -2.637533187866211, -2.5622148513793945, -2.486896514892578, -2.4115781784057617, -2.3362598419189453, -2.260941505432129, -2.1856231689453125, -2.110304594039917, -2.0349864959716797, -1.9596681594848633, -1.8843498229980469, -1.8090314865112305, -1.7337130308151245, -1.658394694328308, -1.5830763578414917, -1.5077579021453857, -1.4324395656585693, -1.357121229171753, -1.2818028926849365, -1.2064845561981201, -1.1311661005020142, -1.0558477640151978, -0.9805294275283813, -0.9052110314369202, -0.8298927545547485, -0.7545744180679321, -0.679256021976471, -0.6039376854896545, -0.5286192893981934, -0.45330095291137695, -0.37798261642456055, -0.30266422033309937, -0.22734588384628296, -0.15202751755714417, -0.07670916616916656, -0.0013908147811889648, 0.07392755150794983, 0.14924591779708862, 0.22456425428390503, 0.2998826503753662, 0.3752009868621826, 0.4505193531513214, 0.5258377194404602, 0.6011560559272766, 0.6764744520187378, 0.7517927885055542, 0.8271111249923706, 0.9024295210838318, 0.9777478575706482, 1.0530662536621094, 1.1283845901489258, 1.2037029266357422, 1.2790212631225586, 1.354339599609375, 1.4296579360961914, 1.5049763917922974, 1.5802947282791138]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 1.0, 6.0, 6.0, 9.0, 12.0, 3.0, 22.0, 14.0, 18.0, 18.0, 20.0, 39.0, 25.0, 28.0, 31.0, 24.0, 36.0, 38.0, 29.0, 45.0, 45.0, 48.0, 55.0, 36.0, 38.0, 34.0, 37.0, 37.0, 37.0, 35.0, 22.0, 25.0, 18.0, 25.0, 12.0, 15.0, 9.0, 11.0, 9.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 4.0], "bins": [-1.682024598121643, -1.6340625286102295, -1.5861003398895264, -1.5381382703781128, -1.4901762008666992, -1.4422141313552856, -1.394252061843872, -1.346289873123169, -1.2983278036117554, -1.2503657341003418, -1.2024035453796387, -1.154441475868225, -1.1064794063568115, -1.058517336845398, -1.0105552673339844, -0.9625930786132812, -0.9146310091018677, -0.8666689395904541, -0.8187068104743958, -0.7707446813583374, -0.7227826118469238, -0.6748205423355103, -0.6268584132194519, -0.5788962841033936, -0.53093421459198, -0.482972115278244, -0.43501001596450806, -0.3870479166507721, -0.33908581733703613, -0.29112371802330017, -0.2431616187095642, -0.19519951939582825, -0.14723742008209229, -0.09927532076835632, -0.05131322145462036, -0.0033511221408843994, 0.04461097717285156, 0.09257307648658752, 0.1405351758003235, 0.18849727511405945, 0.2364593744277954, 0.28442147374153137, 0.33238357305526733, 0.3803456723690033, 0.42830777168273926, 0.4762698709964752, 0.5242319703102112, 0.5721940994262695, 0.6201561689376831, 0.6681182384490967, 0.716080367565155, 0.7640424966812134, 0.812004566192627, 0.8599666357040405, 0.9079287648200989, 0.9558908939361572, 1.0038529634475708, 1.0518150329589844, 1.0997772216796875, 1.147739291191101, 1.1957013607025146, 1.2436634302139282, 1.2916254997253418, 1.339587688446045, 1.3875497579574585]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 8.0, 10.0, 19.0, 34.0, 38.0, 54.0, 98.0, 108.0, 160.0, 212.0, 297.0, 400.0, 642.0, 997.0, 1424.0, 2158.0, 3393.0, 5267.0, 8287.0, 13691.0, 22612.0, 39116.0, 69540.0, 128403.0, 230395.0, 228074.0, 126603.0, 68302.0, 38661.0, 22562.0, 13567.0, 8148.0, 5254.0, 3330.0, 2151.0, 1442.0, 997.0, 629.0, 402.0, 311.0, 207.0, 158.0, 114.0, 80.0, 56.0, 53.0, 26.0, 25.0, 11.0, 7.0, 3.0, 7.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.15625, -2.086669921875, -2.01708984375, -1.947509765625, -1.8779296875, -1.808349609375, -1.73876953125, -1.669189453125, -1.599609375, -1.530029296875, -1.46044921875, -1.390869140625, -1.3212890625, -1.251708984375, -1.18212890625, -1.112548828125, -1.04296875, -0.973388671875, -0.90380859375, -0.834228515625, -0.7646484375, -0.695068359375, -0.62548828125, -0.555908203125, -0.486328125, -0.416748046875, -0.34716796875, -0.277587890625, -0.2080078125, -0.138427734375, -0.06884765625, 0.000732421875, 0.0703125, 0.139892578125, 0.20947265625, 0.279052734375, 0.3486328125, 0.418212890625, 0.48779296875, 0.557373046875, 0.626953125, 0.696533203125, 0.76611328125, 0.835693359375, 0.9052734375, 0.974853515625, 1.04443359375, 1.114013671875, 1.18359375, 1.253173828125, 1.32275390625, 1.392333984375, 1.4619140625, 1.531494140625, 1.60107421875, 1.670654296875, 1.740234375, 1.809814453125, 1.87939453125, 1.948974609375, 2.0185546875, 2.088134765625, 2.15771484375, 2.227294921875, 2.296875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 1.0, 8.0, 4.0, 3.0, 13.0, 10.0, 12.0, 14.0, 24.0, 27.0, 29.0, 28.0, 26.0, 26.0, 32.0, 34.0, 37.0, 38.0, 40.0, 46.0, 62.0, 50.0, 37.0, 42.0, 41.0, 40.0, 35.0, 40.0, 30.0, 33.0, 20.0, 25.0, 22.0, 11.0, 12.0, 12.0, 7.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.5322265625, -1.4876708984375, -1.443115234375, -1.3985595703125, -1.35400390625, -1.3094482421875, -1.264892578125, -1.2203369140625, -1.17578125, -1.1312255859375, -1.086669921875, -1.0421142578125, -0.99755859375, -0.9530029296875, -0.908447265625, -0.8638916015625, -0.8193359375, -0.7747802734375, -0.730224609375, -0.6856689453125, -0.64111328125, -0.5965576171875, -0.552001953125, -0.5074462890625, -0.462890625, -0.4183349609375, -0.373779296875, -0.3292236328125, -0.28466796875, -0.2401123046875, -0.195556640625, -0.1510009765625, -0.1064453125, -0.0618896484375, -0.017333984375, 0.0272216796875, 0.07177734375, 0.1163330078125, 0.160888671875, 0.2054443359375, 0.25, 0.2945556640625, 0.339111328125, 0.3836669921875, 0.42822265625, 0.4727783203125, 0.517333984375, 0.5618896484375, 0.6064453125, 0.6510009765625, 0.695556640625, 0.7401123046875, 0.78466796875, 0.8292236328125, 0.873779296875, 0.9183349609375, 0.962890625, 1.0074462890625, 1.052001953125, 1.0965576171875, 1.14111328125, 1.1856689453125, 1.230224609375, 1.2747802734375, 1.3193359375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 9.0, 9.0, 24.0, 17.0, 33.0, 60.0, 110.0, 163.0, 331.0, 535.0, 965.0, 1859.0, 3685.0, 7557.0, 16653.0, 39446.0, 106038.0, 317182.0, 354956.0, 119430.0, 44401.0, 18348.0, 8349.0, 4006.0, 1920.0, 1083.0, 580.0, 328.0, 179.0, 107.0, 73.0, 43.0, 24.0, 20.0, 13.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6953125, -3.580047607421875, -3.46478271484375, -3.349517822265625, -3.2342529296875, -3.118988037109375, -3.00372314453125, -2.888458251953125, -2.773193359375, -2.657928466796875, -2.54266357421875, -2.427398681640625, -2.3121337890625, -2.196868896484375, -2.08160400390625, -1.966339111328125, -1.85107421875, -1.735809326171875, -1.62054443359375, -1.505279541015625, -1.3900146484375, -1.274749755859375, -1.15948486328125, -1.044219970703125, -0.928955078125, -0.813690185546875, -0.69842529296875, -0.583160400390625, -0.4678955078125, -0.352630615234375, -0.23736572265625, -0.122100830078125, -0.0068359375, 0.108428955078125, 0.22369384765625, 0.338958740234375, 0.4542236328125, 0.569488525390625, 0.68475341796875, 0.800018310546875, 0.915283203125, 1.030548095703125, 1.14581298828125, 1.261077880859375, 1.3763427734375, 1.491607666015625, 1.60687255859375, 1.722137451171875, 1.83740234375, 1.952667236328125, 2.06793212890625, 2.183197021484375, 2.2984619140625, 2.413726806640625, 2.52899169921875, 2.644256591796875, 2.759521484375, 2.874786376953125, 2.99005126953125, 3.105316162109375, 3.2205810546875, 3.335845947265625, 3.45111083984375, 3.566375732421875, 3.681640625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 11.0, 10.0, 15.0, 15.0, 18.0, 30.0, 32.0, 29.0, 37.0, 46.0, 53.0, 52.0, 43.0, 56.0, 47.0, 54.0, 58.0, 41.0, 48.0, 49.0, 28.0, 38.0, 25.0, 22.0, 27.0, 26.0, 17.0, 9.0, 17.0, 6.0, 8.0, 12.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1484375, -1.1145782470703125, -1.080718994140625, -1.0468597412109375, -1.01300048828125, -0.9791412353515625, -0.945281982421875, -0.9114227294921875, -0.8775634765625, -0.8437042236328125, -0.809844970703125, -0.7759857177734375, -0.74212646484375, -0.7082672119140625, -0.674407958984375, -0.6405487060546875, -0.606689453125, -0.5728302001953125, -0.538970947265625, -0.5051116943359375, -0.47125244140625, -0.4373931884765625, -0.403533935546875, -0.3696746826171875, -0.3358154296875, -0.3019561767578125, -0.268096923828125, -0.2342376708984375, -0.20037841796875, -0.1665191650390625, -0.132659912109375, -0.0988006591796875, -0.06494140625, -0.0310821533203125, 0.002777099609375, 0.0366363525390625, 0.07049560546875, 0.1043548583984375, 0.138214111328125, 0.1720733642578125, 0.2059326171875, 0.2397918701171875, 0.273651123046875, 0.3075103759765625, 0.34136962890625, 0.3752288818359375, 0.409088134765625, 0.4429473876953125, 0.476806640625, 0.5106658935546875, 0.544525146484375, 0.5783843994140625, 0.61224365234375, 0.6461029052734375, 0.679962158203125, 0.7138214111328125, 0.7476806640625, 0.7815399169921875, 0.815399169921875, 0.8492584228515625, 0.88311767578125, 0.9169769287109375, 0.950836181640625, 0.9846954345703125, 1.0185546875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 2.0, 7.0, 3.0, 10.0, 15.0, 20.0, 26.0, 39.0, 48.0, 66.0, 89.0, 116.0, 182.0, 262.0, 358.0, 504.0, 804.0, 1162.0, 1894.0, 2992.0, 5191.0, 9537.0, 19099.0, 47629.0, 242950.0, 613039.0, 55866.0, 21335.0, 10374.0, 5643.0, 3307.0, 2012.0, 1274.0, 844.0, 521.0, 389.0, 264.0, 189.0, 140.0, 94.0, 61.0, 48.0, 41.0, 32.0, 20.0, 14.0, 13.0, 9.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.169921875, -2.102264404296875, -2.03460693359375, -1.966949462890625, -1.8992919921875, -1.831634521484375, -1.76397705078125, -1.696319580078125, -1.628662109375, -1.561004638671875, -1.49334716796875, -1.425689697265625, -1.3580322265625, -1.290374755859375, -1.22271728515625, -1.155059814453125, -1.08740234375, -1.019744873046875, -0.95208740234375, -0.884429931640625, -0.8167724609375, -0.749114990234375, -0.68145751953125, -0.613800048828125, -0.546142578125, -0.478485107421875, -0.41082763671875, -0.343170166015625, -0.2755126953125, -0.207855224609375, -0.14019775390625, -0.072540283203125, -0.0048828125, 0.062774658203125, 0.13043212890625, 0.198089599609375, 0.2657470703125, 0.333404541015625, 0.40106201171875, 0.468719482421875, 0.536376953125, 0.604034423828125, 0.67169189453125, 0.739349365234375, 0.8070068359375, 0.874664306640625, 0.94232177734375, 1.009979248046875, 1.07763671875, 1.145294189453125, 1.21295166015625, 1.280609130859375, 1.3482666015625, 1.415924072265625, 1.48358154296875, 1.551239013671875, 1.618896484375, 1.686553955078125, 1.75421142578125, 1.821868896484375, 1.8895263671875, 1.957183837890625, 2.02484130859375, 2.092498779296875, 2.16015625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 6.0, 8.0, 6.0, 11.0, 14.0, 18.0, 26.0, 41.0, 67.0, 154.0, 325.0, 127.0, 59.0, 34.0, 22.0, 24.0, 13.0, 7.0, 9.0, 7.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18832015991211e-05, -6.959866732358932e-05, -6.731413304805756e-05, -6.502959877252579e-05, -6.274506449699402e-05, -6.046053022146225e-05, -5.817599594593048e-05, -5.589146167039871e-05, -5.360692739486694e-05, -5.1322393119335175e-05, -4.9037858843803406e-05, -4.675332456827164e-05, -4.446879029273987e-05, -4.21842560172081e-05, -3.989972174167633e-05, -3.761518746614456e-05, -3.533065319061279e-05, -3.3046118915081024e-05, -3.0761584639549255e-05, -2.8477050364017487e-05, -2.6192516088485718e-05, -2.390798181295395e-05, -2.162344753742218e-05, -1.933891326189041e-05, -1.7054378986358643e-05, -1.4769844710826874e-05, -1.2485310435295105e-05, -1.0200776159763336e-05, -7.916241884231567e-06, -5.631707608699799e-06, -3.3471733331680298e-06, -1.062639057636261e-06, 1.2218952178955078e-06, 3.5064294934272766e-06, 5.790963768959045e-06, 8.075498044490814e-06, 1.0360032320022583e-05, 1.2644566595554352e-05, 1.492910087108612e-05, 1.721363514661789e-05, 1.9498169422149658e-05, 2.1782703697681427e-05, 2.4067237973213196e-05, 2.6351772248744965e-05, 2.8636306524276733e-05, 3.09208407998085e-05, 3.320537507534027e-05, 3.548990935087204e-05, 3.777444362640381e-05, 4.005897790193558e-05, 4.2343512177467346e-05, 4.4628046452999115e-05, 4.6912580728530884e-05, 4.919711500406265e-05, 5.148164927959442e-05, 5.376618355512619e-05, 5.605071783065796e-05, 5.833525210618973e-05, 6.0619786381721497e-05, 6.290432065725327e-05, 6.518885493278503e-05, 6.74733892083168e-05, 6.975792348384857e-05, 7.204245775938034e-05, 7.432699203491211e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 8.0, 12.0, 19.0, 27.0, 28.0, 36.0, 51.0, 80.0, 114.0, 156.0, 229.0, 325.0, 489.0, 759.0, 1127.0, 1744.0, 2923.0, 4821.0, 9122.0, 19354.0, 52656.0, 683914.0, 195774.0, 39968.0, 15471.0, 7801.0, 4321.0, 2557.0, 1494.0, 1015.0, 684.0, 444.0, 282.0, 222.0, 152.0, 108.0, 69.0, 45.0, 41.0, 27.0, 23.0, 14.0, 12.0, 9.0, 8.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.509765625, -2.4310302734375, -2.352294921875, -2.2735595703125, -2.19482421875, -2.1160888671875, -2.037353515625, -1.9586181640625, -1.8798828125, -1.8011474609375, -1.722412109375, -1.6436767578125, -1.56494140625, -1.4862060546875, -1.407470703125, -1.3287353515625, -1.25, -1.1712646484375, -1.092529296875, -1.0137939453125, -0.93505859375, -0.8563232421875, -0.777587890625, -0.6988525390625, -0.6201171875, -0.5413818359375, -0.462646484375, -0.3839111328125, -0.30517578125, -0.2264404296875, -0.147705078125, -0.0689697265625, 0.009765625, 0.0885009765625, 0.167236328125, 0.2459716796875, 0.32470703125, 0.4034423828125, 0.482177734375, 0.5609130859375, 0.6396484375, 0.7183837890625, 0.797119140625, 0.8758544921875, 0.95458984375, 1.0333251953125, 1.112060546875, 1.1907958984375, 1.26953125, 1.3482666015625, 1.427001953125, 1.5057373046875, 1.58447265625, 1.6632080078125, 1.741943359375, 1.8206787109375, 1.8994140625, 1.9781494140625, 2.056884765625, 2.1356201171875, 2.21435546875, 2.2930908203125, 2.371826171875, 2.4505615234375, 2.529296875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 4.0, 7.0, 5.0, 4.0, 4.0, 1.0, 8.0, 8.0, 17.0, 30.0, 25.0, 36.0, 56.0, 103.0, 375.0, 111.0, 49.0, 35.0, 34.0, 22.0, 12.0, 14.0, 11.0, 7.0, 5.0, 3.0, 7.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.705078125, -0.6834259033203125, -0.661773681640625, -0.6401214599609375, -0.61846923828125, -0.5968170166015625, -0.575164794921875, -0.5535125732421875, -0.5318603515625, -0.5102081298828125, -0.488555908203125, -0.4669036865234375, -0.44525146484375, -0.4235992431640625, -0.401947021484375, -0.3802947998046875, -0.358642578125, -0.3369903564453125, -0.315338134765625, -0.2936859130859375, -0.27203369140625, -0.2503814697265625, -0.228729248046875, -0.2070770263671875, -0.1854248046875, -0.1637725830078125, -0.142120361328125, -0.1204681396484375, -0.09881591796875, -0.0771636962890625, -0.055511474609375, -0.0338592529296875, -0.01220703125, 0.0094451904296875, 0.031097412109375, 0.0527496337890625, 0.07440185546875, 0.0960540771484375, 0.117706298828125, 0.1393585205078125, 0.1610107421875, 0.1826629638671875, 0.204315185546875, 0.2259674072265625, 0.24761962890625, 0.2692718505859375, 0.290924072265625, 0.3125762939453125, 0.334228515625, 0.3558807373046875, 0.377532958984375, 0.3991851806640625, 0.42083740234375, 0.4424896240234375, 0.464141845703125, 0.4857940673828125, 0.5074462890625, 0.5290985107421875, 0.550750732421875, 0.5724029541015625, 0.59405517578125, 0.6157073974609375, 0.637359619140625, 0.6590118408203125, 0.6806640625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 5.0, 6.0, 7.0, 15.0, 12.0, 21.0, 19.0, 30.0, 44.0, 67.0, 85.0, 105.0, 111.0, 111.0, 84.0, 57.0, 50.0, 39.0, 37.0, 22.0, 16.0, 13.0, 12.0, 10.0, 3.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0142390727996826, -1.9521145820617676, -1.889989972114563, -1.8278653621673584, -1.7657408714294434, -1.7036163806915283, -1.6414917707443237, -1.5793671607971191, -1.517242670059204, -1.455118179321289, -1.3929935693740845, -1.3308689594268799, -1.2687444686889648, -1.2066199779510498, -1.1444953680038452, -1.0823707580566406, -1.0202462673187256, -0.9581217169761658, -0.895997166633606, -0.8338726162910461, -0.7717480659484863, -0.7096235156059265, -0.6474989652633667, -0.5853744149208069, -0.5232498645782471, -0.46112531423568726, -0.39900076389312744, -0.3368762135505676, -0.2747516632080078, -0.212627112865448, -0.15050256252288818, -0.08837801218032837, -0.026253461837768555, 0.03587108850479126, 0.09799563884735107, 0.1601201891899109, 0.2222447395324707, 0.2843692898750305, 0.34649384021759033, 0.40861839056015015, 0.47074294090270996, 0.5328674912452698, 0.5949920415878296, 0.6571165919303894, 0.7192411422729492, 0.781365692615509, 0.8434902429580688, 0.9056147933006287, 0.9677393436431885, 1.0298638343811035, 1.091988444328308, 1.1541130542755127, 1.2162375450134277, 1.2783620357513428, 1.3404866456985474, 1.402611255645752, 1.464735746383667, 1.526860237121582, 1.5889848470687866, 1.6511094570159912, 1.7132339477539062, 1.7753584384918213, 1.8374830484390259, 1.8996076583862305, 1.9617321491241455]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 10.0, 10.0, 11.0, 11.0, 18.0, 18.0, 13.0, 14.0, 27.0, 30.0, 31.0, 50.0, 37.0, 25.0, 31.0, 32.0, 45.0, 40.0, 45.0, 51.0, 43.0, 42.0, 43.0, 31.0, 38.0, 40.0, 36.0, 25.0, 29.0, 31.0, 8.0, 14.0, 9.0, 8.0, 11.0, 3.0, 10.0, 8.0, 6.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3962475061416626, -1.3486615419387817, -1.3010754585266113, -1.2534894943237305, -1.2059035301208496, -1.1583174467086792, -1.1107314825057983, -1.063145399093628, -1.015559434890747, -0.9679734110832214, -0.9203874468803406, -0.8728014230728149, -0.8252153992652893, -0.7776293754577637, -0.7300434112548828, -0.6824573874473572, -0.6348714232444763, -0.5872853994369507, -0.5396994352340698, -0.4921134114265442, -0.44452738761901855, -0.3969413936138153, -0.34935539960861206, -0.3017693758010864, -0.2541833817958832, -0.20659737288951874, -0.1590113639831543, -0.11142536997795105, -0.06383936107158661, -0.016253352165222168, 0.03133264183998108, 0.07891866564750671, 0.12650465965270996, 0.1740906685590744, 0.22167667746543884, 0.2692626714706421, 0.3168486952781677, 0.36443468928337097, 0.4120206832885742, 0.45960670709609985, 0.5071927309036255, 0.5547787547111511, 0.602364718914032, 0.6499507427215576, 0.6975367665290833, 0.7451227903366089, 0.7927087545394897, 0.8402947783470154, 0.8878807425498962, 0.9354667663574219, 0.9830527305603027, 1.0306386947631836, 1.078224778175354, 1.1258107423782349, 1.1733968257904053, 1.2209827899932861, 1.268568754196167, 1.3161547183990479, 1.3637408018112183, 1.4113267660140991, 1.45891273021698, 1.5064988136291504, 1.5540847778320312, 1.601670742034912, 1.6492568254470825]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 13.0, 13.0, 15.0, 32.0, 41.0, 64.0, 70.0, 124.0, 166.0, 264.0, 329.0, 495.0, 702.0, 1058.0, 1536.0, 2273.0, 3402.0, 5277.0, 8210.0, 13341.0, 21608.0, 37396.0, 68240.0, 137188.0, 339313.0, 1316552.0, 1509926.0, 393965.0, 151461.0, 75384.0, 41555.0, 23884.0, 14572.0, 8828.0, 5754.0, 3742.0, 2346.0, 1645.0, 1052.0, 764.0, 494.0, 363.0, 262.0, 162.0, 120.0, 97.0, 63.0, 41.0, 21.0, 27.0, 9.0, 11.0, 5.0, 7.0, 3.0, 1.0, 1.0], "bins": [-1.93359375, -1.8751068115234375, -1.816619873046875, -1.7581329345703125, -1.69964599609375, -1.6411590576171875, -1.582672119140625, -1.5241851806640625, -1.4656982421875, -1.4072113037109375, -1.348724365234375, -1.2902374267578125, -1.23175048828125, -1.1732635498046875, -1.114776611328125, -1.0562896728515625, -0.997802734375, -0.9393157958984375, -0.880828857421875, -0.8223419189453125, -0.76385498046875, -0.7053680419921875, -0.646881103515625, -0.5883941650390625, -0.5299072265625, -0.4714202880859375, -0.412933349609375, -0.3544464111328125, -0.29595947265625, -0.2374725341796875, -0.178985595703125, -0.1204986572265625, -0.06201171875, -0.0035247802734375, 0.054962158203125, 0.1134490966796875, 0.17193603515625, 0.2304229736328125, 0.288909912109375, 0.3473968505859375, 0.4058837890625, 0.4643707275390625, 0.522857666015625, 0.5813446044921875, 0.63983154296875, 0.6983184814453125, 0.756805419921875, 0.8152923583984375, 0.873779296875, 0.9322662353515625, 0.990753173828125, 1.0492401123046875, 1.10772705078125, 1.1662139892578125, 1.224700927734375, 1.2831878662109375, 1.3416748046875, 1.4001617431640625, 1.458648681640625, 1.5171356201171875, 1.57562255859375, 1.6341094970703125, 1.692596435546875, 1.7510833740234375, 1.8095703125]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 9.0, 9.0, 6.0, 4.0, 20.0, 12.0, 21.0, 11.0, 12.0, 22.0, 25.0, 26.0, 41.0, 36.0, 38.0, 33.0, 26.0, 44.0, 34.0, 49.0, 43.0, 43.0, 46.0, 45.0, 45.0, 30.0, 37.0, 23.0, 27.0, 31.0, 28.0, 16.0, 26.0, 10.0, 13.0, 9.0, 8.0, 8.0, 5.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8681640625, -0.8392181396484375, -0.810272216796875, -0.7813262939453125, -0.75238037109375, -0.7234344482421875, -0.694488525390625, -0.6655426025390625, -0.6365966796875, -0.6076507568359375, -0.578704833984375, -0.5497589111328125, -0.52081298828125, -0.4918670654296875, -0.462921142578125, -0.4339752197265625, -0.405029296875, -0.3760833740234375, -0.347137451171875, -0.3181915283203125, -0.28924560546875, -0.2602996826171875, -0.231353759765625, -0.2024078369140625, -0.1734619140625, -0.1445159912109375, -0.115570068359375, -0.0866241455078125, -0.05767822265625, -0.0287322998046875, 0.000213623046875, 0.0291595458984375, 0.05810546875, 0.0870513916015625, 0.115997314453125, 0.1449432373046875, 0.17388916015625, 0.2028350830078125, 0.231781005859375, 0.2607269287109375, 0.2896728515625, 0.3186187744140625, 0.347564697265625, 0.3765106201171875, 0.40545654296875, 0.4344024658203125, 0.463348388671875, 0.4922943115234375, 0.521240234375, 0.5501861572265625, 0.579132080078125, 0.6080780029296875, 0.63702392578125, 0.6659698486328125, 0.694915771484375, 0.7238616943359375, 0.7528076171875, 0.7817535400390625, 0.810699462890625, 0.8396453857421875, 0.86859130859375, 0.8975372314453125, 0.926483154296875, 0.9554290771484375, 0.984375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 3.0, 8.0, 6.0, 9.0, 15.0, 30.0, 27.0, 50.0, 57.0, 94.0, 156.0, 204.0, 316.0, 431.0, 711.0, 1078.0, 1600.0, 2417.0, 3944.0, 6087.0, 9719.0, 15847.0, 26493.0, 45554.0, 82801.0, 158501.0, 337171.0, 907910.0, 1537083.0, 551884.0, 234558.0, 116289.0, 62672.0, 35095.0, 20712.0, 12582.0, 7984.0, 4953.0, 3250.0, 2036.0, 1361.0, 837.0, 578.0, 389.0, 249.0, 159.0, 103.0, 97.0, 64.0, 29.0, 29.0, 18.0, 14.0, 14.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0], "bins": [-1.513671875, -1.466766357421875, -1.41986083984375, -1.372955322265625, -1.3260498046875, -1.279144287109375, -1.23223876953125, -1.185333251953125, -1.138427734375, -1.091522216796875, -1.04461669921875, -0.997711181640625, -0.9508056640625, -0.903900146484375, -0.85699462890625, -0.810089111328125, -0.76318359375, -0.716278076171875, -0.66937255859375, -0.622467041015625, -0.5755615234375, -0.528656005859375, -0.48175048828125, -0.434844970703125, -0.387939453125, -0.341033935546875, -0.29412841796875, -0.247222900390625, -0.2003173828125, -0.153411865234375, -0.10650634765625, -0.059600830078125, -0.0126953125, 0.034210205078125, 0.08111572265625, 0.128021240234375, 0.1749267578125, 0.221832275390625, 0.26873779296875, 0.315643310546875, 0.362548828125, 0.409454345703125, 0.45635986328125, 0.503265380859375, 0.5501708984375, 0.597076416015625, 0.64398193359375, 0.690887451171875, 0.73779296875, 0.784698486328125, 0.83160400390625, 0.878509521484375, 0.9254150390625, 0.972320556640625, 1.01922607421875, 1.066131591796875, 1.113037109375, 1.159942626953125, 1.20684814453125, 1.253753662109375, 1.3006591796875, 1.347564697265625, 1.39447021484375, 1.441375732421875, 1.48828125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 3.0, 3.0, 13.0, 11.0, 14.0, 12.0, 29.0, 25.0, 35.0, 40.0, 60.0, 59.0, 81.0, 82.0, 105.0, 142.0, 147.0, 168.0, 187.0, 209.0, 243.0, 275.0, 221.0, 248.0, 229.0, 182.0, 176.0, 159.0, 118.0, 129.0, 104.0, 96.0, 86.0, 59.0, 63.0, 58.0, 43.0, 25.0, 29.0, 15.0, 18.0, 14.0, 15.0, 8.0, 8.0, 10.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.39990234375, -0.38651275634765625, -0.3731231689453125, -0.35973358154296875, -0.346343994140625, -0.33295440673828125, -0.3195648193359375, -0.30617523193359375, -0.29278564453125, -0.27939605712890625, -0.2660064697265625, -0.25261688232421875, -0.239227294921875, -0.22583770751953125, -0.2124481201171875, -0.19905853271484375, -0.1856689453125, -0.17227935791015625, -0.1588897705078125, -0.14550018310546875, -0.132110595703125, -0.11872100830078125, -0.1053314208984375, -0.09194183349609375, -0.07855224609375, -0.06516265869140625, -0.0517730712890625, -0.03838348388671875, -0.024993896484375, -0.01160430908203125, 0.0017852783203125, 0.01517486572265625, 0.028564453125, 0.04195404052734375, 0.0553436279296875, 0.06873321533203125, 0.082122802734375, 0.09551239013671875, 0.1089019775390625, 0.12229156494140625, 0.13568115234375, 0.14907073974609375, 0.1624603271484375, 0.17584991455078125, 0.189239501953125, 0.20262908935546875, 0.2160186767578125, 0.22940826416015625, 0.2427978515625, 0.25618743896484375, 0.2695770263671875, 0.28296661376953125, 0.296356201171875, 0.30974578857421875, 0.3231353759765625, 0.33652496337890625, 0.34991455078125, 0.36330413818359375, 0.3766937255859375, 0.39008331298828125, 0.403472900390625, 0.41686248779296875, 0.4302520751953125, 0.44364166259765625, 0.45703125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 7.0, 5.0, 7.0, 9.0, 16.0, 12.0, 14.0, 26.0, 24.0, 34.0, 41.0, 53.0, 52.0, 76.0, 97.0, 100.0, 87.0, 69.0, 49.0, 43.0, 31.0, 28.0, 16.0, 24.0, 15.0, 15.0, 8.0, 9.0, 8.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.128026008605957, -1.0906760692596436, -1.0533260107040405, -1.015976071357727, -0.978626012802124, -0.9412760734558105, -0.9039260745048523, -0.866576075553894, -0.8292260766029358, -0.7918760776519775, -0.7545260787010193, -0.717176079750061, -0.6798261404037476, -0.6424760818481445, -0.605126142501831, -0.5677761435508728, -0.5304261445999146, -0.4930761456489563, -0.45572614669799805, -0.4183761775493622, -0.38102617859840393, -0.3436761796474457, -0.3063262104988098, -0.26897621154785156, -0.2316262125968933, -0.19427621364593506, -0.156926229596138, -0.11957623809576035, -0.08222624659538269, -0.04487624764442444, -0.00752626359462738, 0.029823720455169678, 0.06717383861541748, 0.10452383011579514, 0.1418738216161728, 0.17922380566596985, 0.2165738046169281, 0.25392380356788635, 0.2912737727165222, 0.32862377166748047, 0.3659737706184387, 0.403323769569397, 0.4406737685203552, 0.4780237376689911, 0.515373706817627, 0.55272376537323, 0.5900737047195435, 0.6274237036705017, 0.66477370262146, 0.7021237015724182, 0.7394737005233765, 0.7768236994743347, 0.814173698425293, 0.8515236377716064, 0.8888736367225647, 0.926223635673523, 0.9635736346244812, 1.0009236335754395, 1.038273572921753, 1.075623631477356, 1.1129735708236694, 1.1503236293792725, 1.187673568725586, 1.2250235080718994, 1.2623735666275024]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 13.0, 13.0, 21.0, 4.0, 20.0, 22.0, 25.0, 21.0, 24.0, 30.0, 30.0, 32.0, 34.0, 31.0, 44.0, 38.0, 31.0, 29.0, 27.0, 52.0, 42.0, 34.0, 37.0, 37.0, 37.0, 32.0, 22.0, 27.0, 21.0, 22.0, 22.0, 16.0, 15.0, 17.0, 8.0, 11.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9285595417022705, -0.8976151943206787, -0.8666708469390869, -0.8357264995574951, -0.8047821521759033, -0.7738378047943115, -0.7428934574127197, -0.7119491100311279, -0.6810047626495361, -0.6500604152679443, -0.6191160678863525, -0.5881717205047607, -0.557227373123169, -0.5262830257415771, -0.49533870816230774, -0.46439436078071594, -0.43345004320144653, -0.40250569581985474, -0.37156134843826294, -0.34061700105667114, -0.30967265367507935, -0.27872830629348755, -0.24778398871421814, -0.21683964133262634, -0.18589529395103455, -0.15495094656944275, -0.12400660663843155, -0.09306226670742035, -0.06211791932582855, -0.031173571944236755, -0.00022923946380615234, 0.030715107917785645, 0.06165945529937744, 0.09260380268096924, 0.12354814261198044, 0.15449248254299164, 0.18543682992458344, 0.21638117730617523, 0.24732550978660583, 0.27826985716819763, 0.30921420454978943, 0.3401585519313812, 0.371102899312973, 0.40204721689224243, 0.43299156427383423, 0.463935911655426, 0.4948802590370178, 0.5258246064186096, 0.5567689538002014, 0.5877133011817932, 0.618657648563385, 0.6496019959449768, 0.6805463433265686, 0.7114906907081604, 0.7424349784851074, 0.7733793258666992, 0.804323673248291, 0.8352680206298828, 0.8662123680114746, 0.8971567153930664, 0.9281010627746582, 0.95904541015625, 0.9899897575378418, 1.0209341049194336, 1.0518784523010254]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 13.0, 11.0, 17.0, 26.0, 28.0, 55.0, 60.0, 115.0, 164.0, 217.0, 381.0, 450.0, 662.0, 1006.0, 1513.0, 2273.0, 3395.0, 5339.0, 8007.0, 12706.0, 20317.0, 33508.0, 57845.0, 105856.0, 205537.0, 259090.0, 142610.0, 75077.0, 42782.0, 25414.0, 15576.0, 9672.0, 6175.0, 4141.0, 2798.0, 1863.0, 1224.0, 812.0, 564.0, 375.0, 304.0, 168.0, 135.0, 91.0, 57.0, 46.0, 25.0, 18.0, 11.0, 12.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.44677734375, -0.4324684143066406, -0.41815948486328125, -0.4038505554199219, -0.3895416259765625, -0.3752326965332031, -0.36092376708984375, -0.3466148376464844, -0.332305908203125, -0.3179969787597656, -0.30368804931640625, -0.2893791198730469, -0.2750701904296875, -0.2607612609863281, -0.24645233154296875, -0.23214340209960938, -0.21783447265625, -0.20352554321289062, -0.18921661376953125, -0.17490768432617188, -0.1605987548828125, -0.14628982543945312, -0.13198089599609375, -0.11767196655273438, -0.103363037109375, -0.08905410766601562, -0.07474517822265625, -0.060436248779296875, -0.0461273193359375, -0.031818389892578125, -0.01750946044921875, -0.003200531005859375, 0.0111083984375, 0.025417327880859375, 0.03972625732421875, 0.054035186767578125, 0.0683441162109375, 0.08265304565429688, 0.09696197509765625, 0.11127090454101562, 0.125579833984375, 0.13988876342773438, 0.15419769287109375, 0.16850662231445312, 0.1828155517578125, 0.19712448120117188, 0.21143341064453125, 0.22574234008789062, 0.24005126953125, 0.2543601989746094, 0.26866912841796875, 0.2829780578613281, 0.2972869873046875, 0.3115959167480469, 0.32590484619140625, 0.3402137756347656, 0.354522705078125, 0.3688316345214844, 0.38314056396484375, 0.3974494934082031, 0.4117584228515625, 0.4260673522949219, 0.44037628173828125, 0.4546852111816406, 0.468994140625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 6.0, 11.0, 11.0, 10.0, 10.0, 10.0, 17.0, 24.0, 23.0, 28.0, 30.0, 37.0, 23.0, 25.0, 41.0, 40.0, 32.0, 34.0, 45.0, 33.0, 46.0, 41.0, 47.0, 46.0, 33.0, 46.0, 36.0, 28.0, 21.0, 18.0, 23.0, 12.0, 14.0, 22.0, 13.0, 14.0, 7.0, 13.0, 8.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.005859375, -0.97296142578125, -0.9400634765625, -0.90716552734375, -0.874267578125, -0.84136962890625, -0.8084716796875, -0.77557373046875, -0.74267578125, -0.70977783203125, -0.6768798828125, -0.64398193359375, -0.611083984375, -0.57818603515625, -0.5452880859375, -0.51239013671875, -0.4794921875, -0.44659423828125, -0.4136962890625, -0.38079833984375, -0.347900390625, -0.31500244140625, -0.2821044921875, -0.24920654296875, -0.21630859375, -0.18341064453125, -0.1505126953125, -0.11761474609375, -0.084716796875, -0.05181884765625, -0.0189208984375, 0.01397705078125, 0.046875, 0.07977294921875, 0.1126708984375, 0.14556884765625, 0.178466796875, 0.21136474609375, 0.2442626953125, 0.27716064453125, 0.31005859375, 0.34295654296875, 0.3758544921875, 0.40875244140625, 0.441650390625, 0.47454833984375, 0.5074462890625, 0.54034423828125, 0.5732421875, 0.60614013671875, 0.6390380859375, 0.67193603515625, 0.704833984375, 0.73773193359375, 0.7706298828125, 0.80352783203125, 0.83642578125, 0.86932373046875, 0.9022216796875, 0.93511962890625, 0.968017578125, 1.00091552734375, 1.0338134765625, 1.06671142578125, 1.099609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 1.0, 5.0, 4.0, 6.0, 7.0, 8.0, 13.0, 18.0, 24.0, 33.0, 61.0, 86.0, 90.0, 137.0, 177.0, 276.0, 354.0, 513.0, 654.0, 942.0, 1405.0, 1878.0, 2685.0, 4127.0, 6680.0, 11510.0, 21297.0, 46670.0, 122056.0, 400096.0, 263704.0, 84580.0, 34735.0, 16907.0, 9294.0, 5551.0, 3641.0, 2481.0, 1650.0, 1160.0, 837.0, 633.0, 434.0, 298.0, 210.0, 165.0, 118.0, 84.0, 69.0, 64.0, 47.0, 25.0, 17.0, 16.0, 8.0, 4.0, 9.0, 3.0, 4.0, 1.0, 3.0], "bins": [-0.6630859375, -0.64288330078125, -0.6226806640625, -0.60247802734375, -0.582275390625, -0.56207275390625, -0.5418701171875, -0.52166748046875, -0.50146484375, -0.48126220703125, -0.4610595703125, -0.44085693359375, -0.420654296875, -0.40045166015625, -0.3802490234375, -0.36004638671875, -0.33984375, -0.31964111328125, -0.2994384765625, -0.27923583984375, -0.259033203125, -0.23883056640625, -0.2186279296875, -0.19842529296875, -0.17822265625, -0.15802001953125, -0.1378173828125, -0.11761474609375, -0.097412109375, -0.07720947265625, -0.0570068359375, -0.03680419921875, -0.0166015625, 0.00360107421875, 0.0238037109375, 0.04400634765625, 0.064208984375, 0.08441162109375, 0.1046142578125, 0.12481689453125, 0.14501953125, 0.16522216796875, 0.1854248046875, 0.20562744140625, 0.225830078125, 0.24603271484375, 0.2662353515625, 0.28643798828125, 0.306640625, 0.32684326171875, 0.3470458984375, 0.36724853515625, 0.387451171875, 0.40765380859375, 0.4278564453125, 0.44805908203125, 0.46826171875, 0.48846435546875, 0.5086669921875, 0.52886962890625, 0.549072265625, 0.56927490234375, 0.5894775390625, 0.60968017578125, 0.6298828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 10.0, 8.0, 12.0, 19.0, 16.0, 12.0, 30.0, 28.0, 24.0, 34.0, 29.0, 55.0, 43.0, 39.0, 29.0, 28.0, 35.0, 42.0, 53.0, 43.0, 48.0, 38.0, 35.0, 37.0, 37.0, 40.0, 35.0, 21.0, 28.0, 14.0, 16.0, 10.0, 16.0, 8.0, 8.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.75048828125, -0.7274856567382812, -0.7044830322265625, -0.6814804077148438, -0.658477783203125, -0.6354751586914062, -0.6124725341796875, -0.5894699096679688, -0.56646728515625, -0.5434646606445312, -0.5204620361328125, -0.49745941162109375, -0.474456787109375, -0.45145416259765625, -0.4284515380859375, -0.40544891357421875, -0.3824462890625, -0.35944366455078125, -0.3364410400390625, -0.31343841552734375, -0.290435791015625, -0.26743316650390625, -0.2444305419921875, -0.22142791748046875, -0.19842529296875, -0.17542266845703125, -0.1524200439453125, -0.12941741943359375, -0.106414794921875, -0.08341217041015625, -0.0604095458984375, -0.03740692138671875, -0.014404296875, 0.00859832763671875, 0.0316009521484375, 0.05460357666015625, 0.077606201171875, 0.10060882568359375, 0.1236114501953125, 0.14661407470703125, 0.16961669921875, 0.19261932373046875, 0.2156219482421875, 0.23862457275390625, 0.261627197265625, 0.28462982177734375, 0.3076324462890625, 0.33063507080078125, 0.3536376953125, 0.37664031982421875, 0.3996429443359375, 0.42264556884765625, 0.445648193359375, 0.46865081787109375, 0.4916534423828125, 0.5146560668945312, 0.53765869140625, 0.5606613159179688, 0.5836639404296875, 0.6066665649414062, 0.629669189453125, 0.6526718139648438, 0.6756744384765625, 0.6986770629882812, 0.7216796875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 2.0, 9.0, 11.0, 17.0, 23.0, 31.0, 53.0, 80.0, 104.0, 136.0, 185.0, 264.0, 421.0, 595.0, 923.0, 1325.0, 1734.0, 2704.0, 4543.0, 7769.0, 15056.0, 34627.0, 115135.0, 643505.0, 141423.0, 38983.0, 16591.0, 8525.0, 4676.0, 2876.0, 1908.0, 1284.0, 930.0, 683.0, 460.0, 318.0, 188.0, 141.0, 120.0, 56.0, 45.0, 33.0, 24.0, 11.0, 6.0, 7.0, 8.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.08367919921875, -0.08094120025634766, -0.07820320129394531, -0.07546520233154297, -0.07272720336914062, -0.06998920440673828, -0.06725120544433594, -0.0645132064819336, -0.06177520751953125, -0.059037208557128906, -0.05629920959472656, -0.05356121063232422, -0.050823211669921875, -0.04808521270751953, -0.04534721374511719, -0.042609214782714844, -0.0398712158203125, -0.037133216857910156, -0.03439521789550781, -0.03165721893310547, -0.028919219970703125, -0.02618122100830078, -0.023443222045898438, -0.020705223083496094, -0.01796722412109375, -0.015229225158691406, -0.012491226196289062, -0.009753227233886719, -0.007015228271484375, -0.004277229309082031, -0.0015392303466796875, 0.0011987686157226562, 0.003936767578125, 0.006674766540527344, 0.009412765502929688, 0.012150764465332031, 0.014888763427734375, 0.01762676239013672, 0.020364761352539062, 0.023102760314941406, 0.02584075927734375, 0.028578758239746094, 0.03131675720214844, 0.03405475616455078, 0.036792755126953125, 0.03953075408935547, 0.04226875305175781, 0.045006752014160156, 0.0477447509765625, 0.050482749938964844, 0.05322074890136719, 0.05595874786376953, 0.058696746826171875, 0.06143474578857422, 0.06417274475097656, 0.0669107437133789, 0.06964874267578125, 0.0723867416381836, 0.07512474060058594, 0.07786273956298828, 0.08060073852539062, 0.08333873748779297, 0.08607673645019531, 0.08881473541259766, 0.091552734375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 0.0, 2.0, 6.0, 3.0, 8.0, 4.0, 3.0, 7.0, 8.0, 15.0, 24.0, 24.0, 20.0, 45.0, 44.0, 56.0, 92.0, 109.0, 124.0, 100.0, 69.0, 48.0, 34.0, 44.0, 19.0, 21.0, 10.0, 10.0, 10.0, 15.0, 4.0, 3.0, 2.0, 8.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.139278411865234e-06, -5.973502993583679e-06, -5.807727575302124e-06, -5.641952157020569e-06, -5.476176738739014e-06, -5.3104013204574585e-06, -5.144625902175903e-06, -4.978850483894348e-06, -4.813075065612793e-06, -4.647299647331238e-06, -4.481524229049683e-06, -4.3157488107681274e-06, -4.149973392486572e-06, -3.984197974205017e-06, -3.818422555923462e-06, -3.6526471376419067e-06, -3.4868717193603516e-06, -3.3210963010787964e-06, -3.155320882797241e-06, -2.989545464515686e-06, -2.823770046234131e-06, -2.6579946279525757e-06, -2.4922192096710205e-06, -2.3264437913894653e-06, -2.16066837310791e-06, -1.994892954826355e-06, -1.8291175365447998e-06, -1.6633421182632446e-06, -1.4975666999816895e-06, -1.3317912817001343e-06, -1.166015863418579e-06, -1.000240445137024e-06, -8.344650268554688e-07, -6.686896085739136e-07, -5.029141902923584e-07, -3.371387720108032e-07, -1.7136335372924805e-07, -5.587935447692871e-09, 1.601874828338623e-07, 3.259629011154175e-07, 4.917383193969727e-07, 6.575137376785278e-07, 8.23289155960083e-07, 9.890645742416382e-07, 1.1548399925231934e-06, 1.3206154108047485e-06, 1.4863908290863037e-06, 1.6521662473678589e-06, 1.817941665649414e-06, 1.9837170839309692e-06, 2.1494925022125244e-06, 2.3152679204940796e-06, 2.4810433387756348e-06, 2.64681875705719e-06, 2.812594175338745e-06, 2.9783695936203003e-06, 3.1441450119018555e-06, 3.3099204301834106e-06, 3.475695848464966e-06, 3.641471266746521e-06, 3.807246685028076e-06, 3.973022103309631e-06, 4.1387975215911865e-06, 4.304572939872742e-06, 4.470348358154297e-06]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 12.0, 7.0, 14.0, 20.0, 30.0, 44.0, 36.0, 84.0, 101.0, 189.0, 276.0, 445.0, 764.0, 1188.0, 2003.0, 3393.0, 6004.0, 10633.0, 19824.0, 40767.0, 104240.0, 462411.0, 256480.0, 71767.0, 31297.0, 15753.0, 8639.0, 4884.0, 2840.0, 1670.0, 1009.0, 639.0, 365.0, 226.0, 153.0, 115.0, 63.0, 60.0, 34.0, 25.0, 20.0, 9.0, 6.0, 6.0, 6.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08612060546875, -0.08313274383544922, -0.08014488220214844, -0.07715702056884766, -0.07416915893554688, -0.0711812973022461, -0.06819343566894531, -0.06520557403564453, -0.06221771240234375, -0.05922985076904297, -0.05624198913574219, -0.053254127502441406, -0.050266265869140625, -0.047278404235839844, -0.04429054260253906, -0.04130268096923828, -0.0383148193359375, -0.03532695770263672, -0.03233909606933594, -0.029351234436035156, -0.026363372802734375, -0.023375511169433594, -0.020387649536132812, -0.01739978790283203, -0.01441192626953125, -0.011424064636230469, -0.008436203002929688, -0.005448341369628906, -0.002460479736328125, 0.0005273818969726562, 0.0035152435302734375, 0.006503105163574219, 0.009490966796875, 0.012478828430175781, 0.015466690063476562, 0.018454551696777344, 0.021442413330078125, 0.024430274963378906, 0.027418136596679688, 0.03040599822998047, 0.03339385986328125, 0.03638172149658203, 0.03936958312988281, 0.042357444763183594, 0.045345306396484375, 0.048333168029785156, 0.05132102966308594, 0.05430889129638672, 0.0572967529296875, 0.06028461456298828, 0.06327247619628906, 0.06626033782958984, 0.06924819946289062, 0.0722360610961914, 0.07522392272949219, 0.07821178436279297, 0.08119964599609375, 0.08418750762939453, 0.08717536926269531, 0.0901632308959961, 0.09315109252929688, 0.09613895416259766, 0.09912681579589844, 0.10211467742919922, 0.1051025390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 3.0, 3.0, 7.0, 6.0, 18.0, 9.0, 13.0, 20.0, 23.0, 31.0, 57.0, 99.0, 180.0, 182.0, 121.0, 58.0, 29.0, 19.0, 17.0, 17.0, 17.0, 17.0, 7.0, 6.0, 6.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041229248046875, -0.03970956802368164, -0.03818988800048828, -0.03667020797729492, -0.03515052795410156, -0.0336308479309082, -0.032111167907714844, -0.030591487884521484, -0.029071807861328125, -0.027552127838134766, -0.026032447814941406, -0.024512767791748047, -0.022993087768554688, -0.021473407745361328, -0.01995372772216797, -0.01843404769897461, -0.01691436767578125, -0.01539468765258789, -0.013875007629394531, -0.012355327606201172, -0.010835647583007812, -0.009315967559814453, -0.007796287536621094, -0.006276607513427734, -0.004756927490234375, -0.0032372474670410156, -0.0017175674438476562, -0.00019788742065429688, 0.0013217926025390625, 0.002841472625732422, 0.004361152648925781, 0.005880832672119141, 0.0074005126953125, 0.00892019271850586, 0.010439872741699219, 0.011959552764892578, 0.013479232788085938, 0.014998912811279297, 0.016518592834472656, 0.018038272857666016, 0.019557952880859375, 0.021077632904052734, 0.022597312927246094, 0.024116992950439453, 0.025636672973632812, 0.027156352996826172, 0.02867603302001953, 0.03019571304321289, 0.03171539306640625, 0.03323507308959961, 0.03475475311279297, 0.03627443313598633, 0.03779411315917969, 0.03931379318237305, 0.040833473205566406, 0.042353153228759766, 0.043872833251953125, 0.045392513275146484, 0.046912193298339844, 0.0484318733215332, 0.04995155334472656, 0.05147123336791992, 0.05299091339111328, 0.05451059341430664, 0.0560302734375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 6.0, 5.0, 18.0, 14.0, 14.0, 25.0, 23.0, 30.0, 52.0, 45.0, 58.0, 95.0, 112.0, 96.0, 76.0, 64.0, 48.0, 42.0, 25.0, 30.0, 18.0, 22.0, 18.0, 9.0, 10.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1446946859359741, -1.1064720153808594, -1.0682493448257446, -1.0300266742706299, -0.9918039441108704, -0.9535812139511108, -0.9153585433959961, -0.8771358728408813, -0.8389132022857666, -0.8006905317306519, -0.7624678015708923, -0.7242451310157776, -0.6860224604606628, -0.6477997303009033, -0.6095770597457886, -0.5713543891906738, -0.5331316590309143, -0.4949089586734772, -0.4566862881183624, -0.4184635877609253, -0.38024091720581055, -0.3420182168483734, -0.3037955164909363, -0.26557284593582153, -0.2273501455783844, -0.18912746012210846, -0.15090477466583252, -0.11268207430839539, -0.07445938885211945, -0.036236703395843506, 0.001985996961593628, 0.040208667516708374, 0.07843136787414551, 0.11665405333042145, 0.1548767387866974, 0.19309943914413452, 0.23132212460041046, 0.2695448100566864, 0.30776751041412354, 0.3459901809692383, 0.3842128813266754, 0.42243558168411255, 0.4606582522392273, 0.49888095259666443, 0.5371036529541016, 0.5753263235092163, 0.613548994064331, 0.6517716646194458, 0.6899943947792053, 0.7282170653343201, 0.7664397954940796, 0.8046624660491943, 0.8428851366043091, 0.8811078071594238, 0.9193305373191833, 0.9575532078742981, 0.9957759380340576, 1.0339986085891724, 1.072221279144287, 1.1104440689086914, 1.1486667394638062, 1.186889410018921, 1.2251120805740356, 1.2633347511291504, 1.3015574216842651]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 8.0, 7.0, 14.0, 12.0, 21.0, 6.0, 18.0, 26.0, 21.0, 21.0, 24.0, 29.0, 30.0, 33.0, 34.0, 28.0, 45.0, 38.0, 30.0, 31.0, 29.0, 52.0, 37.0, 38.0, 38.0, 34.0, 36.0, 34.0, 25.0, 22.0, 26.0, 18.0, 23.0, 18.0, 13.0, 17.0, 10.0, 9.0, 9.0, 6.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9195966720581055, -0.8888828754425049, -0.8581690788269043, -0.8274552822113037, -0.7967415452003479, -0.7660277485847473, -0.7353139519691467, -0.7046001553535461, -0.6738863587379456, -0.643172562122345, -0.6124587655067444, -0.5817450284957886, -0.551031231880188, -0.5203174352645874, -0.4896036386489868, -0.45888984203338623, -0.42817607522010803, -0.39746227860450745, -0.36674851179122925, -0.33603471517562866, -0.3053209185600281, -0.2746071219444275, -0.2438933551311493, -0.2131795585155487, -0.18246577680110931, -0.15175199508666992, -0.12103819847106934, -0.09032441675662994, -0.059610627591609955, -0.028896838426589966, 0.0018169432878494263, 0.03253073990345001, 0.0632445216178894, 0.0939583107829094, 0.12467209994792938, 0.15538588166236877, 0.18609967827796936, 0.21681345999240875, 0.24752724170684814, 0.27824103832244873, 0.3089548349380493, 0.3396686315536499, 0.3703823983669281, 0.4010961949825287, 0.4318099915981293, 0.46252375841140747, 0.49323755502700806, 0.5239513516426086, 0.5546650886535645, 0.585378885269165, 0.6160926818847656, 0.6468064785003662, 0.677520215511322, 0.7082340121269226, 0.7389478087425232, 0.7696616053581238, 0.8003754019737244, 0.831089198589325, 0.8618029952049255, 0.8925167322158813, 0.9232305288314819, 0.9539443254470825, 0.9846581220626831, 1.0153719186782837, 1.0460857152938843]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 13.0, 18.0, 24.0, 40.0, 54.0, 58.0, 120.0, 156.0, 276.0, 367.0, 520.0, 783.0, 1194.0, 1692.0, 2552.0, 4036.0, 6481.0, 10575.0, 17665.0, 30460.0, 55406.0, 104762.0, 203298.0, 268035.0, 155310.0, 79248.0, 43051.0, 24120.0, 14337.0, 8548.0, 5403.0, 3298.0, 2195.0, 1396.0, 924.0, 669.0, 458.0, 309.0, 213.0, 154.0, 110.0, 69.0, 45.0, 37.0, 21.0, 21.0, 10.0, 6.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6591796875, -1.6061553955078125, -1.553131103515625, -1.5001068115234375, -1.44708251953125, -1.3940582275390625, -1.341033935546875, -1.2880096435546875, -1.2349853515625, -1.1819610595703125, -1.128936767578125, -1.0759124755859375, -1.02288818359375, -0.9698638916015625, -0.916839599609375, -0.8638153076171875, -0.810791015625, -0.7577667236328125, -0.704742431640625, -0.6517181396484375, -0.59869384765625, -0.5456695556640625, -0.492645263671875, -0.4396209716796875, -0.3865966796875, -0.3335723876953125, -0.280548095703125, -0.2275238037109375, -0.17449951171875, -0.1214752197265625, -0.068450927734375, -0.0154266357421875, 0.03759765625, 0.0906219482421875, 0.143646240234375, 0.1966705322265625, 0.24969482421875, 0.3027191162109375, 0.355743408203125, 0.4087677001953125, 0.4617919921875, 0.5148162841796875, 0.567840576171875, 0.6208648681640625, 0.67388916015625, 0.7269134521484375, 0.779937744140625, 0.8329620361328125, 0.885986328125, 0.9390106201171875, 0.992034912109375, 1.0450592041015625, 1.09808349609375, 1.1511077880859375, 1.204132080078125, 1.2571563720703125, 1.3101806640625, 1.3632049560546875, 1.416229248046875, 1.4692535400390625, 1.52227783203125, 1.5753021240234375, 1.628326416015625, 1.6813507080078125, 1.734375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 6.0, 8.0, 10.0, 15.0, 14.0, 14.0, 10.0, 16.0, 19.0, 27.0, 24.0, 36.0, 15.0, 41.0, 39.0, 42.0, 35.0, 40.0, 34.0, 35.0, 40.0, 47.0, 50.0, 34.0, 35.0, 33.0, 37.0, 33.0, 34.0, 17.0, 24.0, 18.0, 26.0, 18.0, 16.0, 15.0, 13.0, 4.0, 7.0, 7.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.81494140625, -0.786956787109375, -0.75897216796875, -0.730987548828125, -0.7030029296875, -0.675018310546875, -0.64703369140625, -0.619049072265625, -0.591064453125, -0.563079833984375, -0.53509521484375, -0.507110595703125, -0.4791259765625, -0.451141357421875, -0.42315673828125, -0.395172119140625, -0.3671875, -0.339202880859375, -0.31121826171875, -0.283233642578125, -0.2552490234375, -0.227264404296875, -0.19927978515625, -0.171295166015625, -0.143310546875, -0.115325927734375, -0.08734130859375, -0.059356689453125, -0.0313720703125, -0.003387451171875, 0.02459716796875, 0.052581787109375, 0.08056640625, 0.108551025390625, 0.13653564453125, 0.164520263671875, 0.1925048828125, 0.220489501953125, 0.24847412109375, 0.276458740234375, 0.304443359375, 0.332427978515625, 0.36041259765625, 0.388397216796875, 0.4163818359375, 0.444366455078125, 0.47235107421875, 0.500335693359375, 0.5283203125, 0.556304931640625, 0.58428955078125, 0.612274169921875, 0.6402587890625, 0.668243408203125, 0.69622802734375, 0.724212646484375, 0.752197265625, 0.780181884765625, 0.80816650390625, 0.836151123046875, 0.8641357421875, 0.892120361328125, 0.92010498046875, 0.948089599609375, 0.97607421875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 10.0, 23.0, 22.0, 45.0, 71.0, 113.0, 131.0, 198.0, 305.0, 502.0, 791.0, 1333.0, 2034.0, 3448.0, 5729.0, 10292.0, 18795.0, 35644.0, 72500.0, 161107.0, 322489.0, 217154.0, 95868.0, 45876.0, 23458.0, 12624.0, 7180.0, 4190.0, 2411.0, 1514.0, 989.0, 603.0, 350.0, 218.0, 182.0, 115.0, 70.0, 49.0, 32.0, 26.0, 18.0, 9.0, 8.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.9345703125, -1.873504638671875, -1.81243896484375, -1.751373291015625, -1.6903076171875, -1.629241943359375, -1.56817626953125, -1.507110595703125, -1.446044921875, -1.384979248046875, -1.32391357421875, -1.262847900390625, -1.2017822265625, -1.140716552734375, -1.07965087890625, -1.018585205078125, -0.95751953125, -0.896453857421875, -0.83538818359375, -0.774322509765625, -0.7132568359375, -0.652191162109375, -0.59112548828125, -0.530059814453125, -0.468994140625, -0.407928466796875, -0.34686279296875, -0.285797119140625, -0.2247314453125, -0.163665771484375, -0.10260009765625, -0.041534423828125, 0.01953125, 0.080596923828125, 0.14166259765625, 0.202728271484375, 0.2637939453125, 0.324859619140625, 0.38592529296875, 0.446990966796875, 0.508056640625, 0.569122314453125, 0.63018798828125, 0.691253662109375, 0.7523193359375, 0.813385009765625, 0.87445068359375, 0.935516357421875, 0.99658203125, 1.057647705078125, 1.11871337890625, 1.179779052734375, 1.2408447265625, 1.301910400390625, 1.36297607421875, 1.424041748046875, 1.485107421875, 1.546173095703125, 1.60723876953125, 1.668304443359375, 1.7293701171875, 1.790435791015625, 1.85150146484375, 1.912567138671875, 1.9736328125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 8.0, 7.0, 13.0, 12.0, 20.0, 18.0, 18.0, 17.0, 31.0, 28.0, 24.0, 29.0, 34.0, 45.0, 35.0, 43.0, 45.0, 43.0, 40.0, 36.0, 52.0, 30.0, 47.0, 39.0, 30.0, 36.0, 32.0, 28.0, 14.0, 19.0, 14.0, 16.0, 15.0, 15.0, 12.0, 15.0, 6.0, 9.0, 7.0, 1.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.623046875, -0.6044921875, -0.5859375, -0.5673828125, -0.548828125, -0.5302734375, -0.51171875, -0.4931640625, -0.474609375, -0.4560546875, -0.4375, -0.4189453125, -0.400390625, -0.3818359375, -0.36328125, -0.3447265625, -0.326171875, -0.3076171875, -0.2890625, -0.2705078125, -0.251953125, -0.2333984375, -0.21484375, -0.1962890625, -0.177734375, -0.1591796875, -0.140625, -0.1220703125, -0.103515625, -0.0849609375, -0.06640625, -0.0478515625, -0.029296875, -0.0107421875, 0.0078125, 0.0263671875, 0.044921875, 0.0634765625, 0.08203125, 0.1005859375, 0.119140625, 0.1376953125, 0.15625, 0.1748046875, 0.193359375, 0.2119140625, 0.23046875, 0.2490234375, 0.267578125, 0.2861328125, 0.3046875, 0.3232421875, 0.341796875, 0.3603515625, 0.37890625, 0.3974609375, 0.416015625, 0.4345703125, 0.453125, 0.4716796875, 0.490234375, 0.5087890625, 0.52734375, 0.5458984375, 0.564453125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 5.0, 14.0, 18.0, 23.0, 37.0, 40.0, 69.0, 99.0, 125.0, 188.0, 235.0, 318.0, 442.0, 637.0, 899.0, 1307.0, 1679.0, 2404.0, 3489.0, 5032.0, 7825.0, 13056.0, 24429.0, 55185.0, 692633.0, 146321.0, 40168.0, 19414.0, 10616.0, 6705.0, 4311.0, 3140.0, 2132.0, 1542.0, 1122.0, 782.0, 614.0, 409.0, 322.0, 217.0, 153.0, 103.0, 100.0, 55.0, 37.0, 32.0, 26.0, 15.0, 5.0, 4.0, 11.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.91943359375, -0.8896102905273438, -0.8597869873046875, -0.8299636840820312, -0.800140380859375, -0.7703170776367188, -0.7404937744140625, -0.7106704711914062, -0.68084716796875, -0.6510238647460938, -0.6212005615234375, -0.5913772583007812, -0.561553955078125, -0.5317306518554688, -0.5019073486328125, -0.47208404541015625, -0.4422607421875, -0.41243743896484375, -0.3826141357421875, -0.35279083251953125, -0.322967529296875, -0.29314422607421875, -0.2633209228515625, -0.23349761962890625, -0.20367431640625, -0.17385101318359375, -0.1440277099609375, -0.11420440673828125, -0.084381103515625, -0.05455780029296875, -0.0247344970703125, 0.00508880615234375, 0.034912109375, 0.06473541259765625, 0.0945587158203125, 0.12438201904296875, 0.154205322265625, 0.18402862548828125, 0.2138519287109375, 0.24367523193359375, 0.27349853515625, 0.30332183837890625, 0.3331451416015625, 0.36296844482421875, 0.392791748046875, 0.42261505126953125, 0.4524383544921875, 0.48226165771484375, 0.5120849609375, 0.5419082641601562, 0.5717315673828125, 0.6015548706054688, 0.631378173828125, 0.6612014770507812, 0.6910247802734375, 0.7208480834960938, 0.75067138671875, 0.7804946899414062, 0.8103179931640625, 0.8401412963867188, 0.869964599609375, 0.8997879028320312, 0.9296112060546875, 0.9594345092773438, 0.9892578125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 3.0, 3.0, 5.0, 16.0, 7.0, 14.0, 25.0, 35.0, 41.0, 106.0, 312.0, 202.0, 63.0, 41.0, 36.0, 18.0, 9.0, 10.0, 8.0, 6.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.017353057861328e-05, -3.898702561855316e-05, -3.780052065849304e-05, -3.661401569843292e-05, -3.54275107383728e-05, -3.424100577831268e-05, -3.3054500818252563e-05, -3.1867995858192444e-05, -3.0681490898132324e-05, -2.9494985938072205e-05, -2.8308480978012085e-05, -2.7121976017951965e-05, -2.5935471057891846e-05, -2.4748966097831726e-05, -2.3562461137771606e-05, -2.2375956177711487e-05, -2.1189451217651367e-05, -2.0002946257591248e-05, -1.8816441297531128e-05, -1.7629936337471008e-05, -1.644343137741089e-05, -1.5256926417350769e-05, -1.407042145729065e-05, -1.288391649723053e-05, -1.169741153717041e-05, -1.051090657711029e-05, -9.324401617050171e-06, -8.137896656990051e-06, -6.951391696929932e-06, -5.764886736869812e-06, -4.578381776809692e-06, -3.3918768167495728e-06, -2.205371856689453e-06, -1.0188668966293335e-06, 1.6763806343078613e-07, 1.3541430234909058e-06, 2.5406479835510254e-06, 3.727152943611145e-06, 4.913657903671265e-06, 6.100162863731384e-06, 7.286667823791504e-06, 8.473172783851624e-06, 9.659677743911743e-06, 1.0846182703971863e-05, 1.2032687664031982e-05, 1.3219192624092102e-05, 1.4405697584152222e-05, 1.559220254421234e-05, 1.677870750427246e-05, 1.796521246433258e-05, 1.91517174243927e-05, 2.033822238445282e-05, 2.152472734451294e-05, 2.271123230457306e-05, 2.389773726463318e-05, 2.50842422246933e-05, 2.6270747184753418e-05, 2.7457252144813538e-05, 2.8643757104873657e-05, 2.9830262064933777e-05, 3.1016767024993896e-05, 3.2203271985054016e-05, 3.3389776945114136e-05, 3.4576281905174255e-05, 3.5762786865234375e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 1.0, 9.0, 10.0, 10.0, 18.0, 25.0, 26.0, 33.0, 55.0, 70.0, 96.0, 139.0, 179.0, 278.0, 401.0, 577.0, 864.0, 1256.0, 2004.0, 3005.0, 4984.0, 8233.0, 14941.0, 29826.0, 82575.0, 744358.0, 86205.0, 30392.0, 15225.0, 8540.0, 4953.0, 3109.0, 2039.0, 1318.0, 833.0, 575.0, 456.0, 273.0, 188.0, 142.0, 98.0, 66.0, 45.0, 42.0, 38.0, 20.0, 10.0, 7.0, 7.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.8818359375, -0.851959228515625, -0.82208251953125, -0.792205810546875, -0.7623291015625, -0.732452392578125, -0.70257568359375, -0.672698974609375, -0.642822265625, -0.612945556640625, -0.58306884765625, -0.553192138671875, -0.5233154296875, -0.493438720703125, -0.46356201171875, -0.433685302734375, -0.40380859375, -0.373931884765625, -0.34405517578125, -0.314178466796875, -0.2843017578125, -0.254425048828125, -0.22454833984375, -0.194671630859375, -0.164794921875, -0.134918212890625, -0.10504150390625, -0.075164794921875, -0.0452880859375, -0.015411376953125, 0.01446533203125, 0.044342041015625, 0.07421875, 0.104095458984375, 0.13397216796875, 0.163848876953125, 0.1937255859375, 0.223602294921875, 0.25347900390625, 0.283355712890625, 0.313232421875, 0.343109130859375, 0.37298583984375, 0.402862548828125, 0.4327392578125, 0.462615966796875, 0.49249267578125, 0.522369384765625, 0.55224609375, 0.582122802734375, 0.61199951171875, 0.641876220703125, 0.6717529296875, 0.701629638671875, 0.73150634765625, 0.761383056640625, 0.791259765625, 0.821136474609375, 0.85101318359375, 0.880889892578125, 0.9107666015625, 0.940643310546875, 0.97052001953125, 1.000396728515625, 1.0302734375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 5.0, 7.0, 10.0, 5.0, 9.0, 6.0, 18.0, 17.0, 17.0, 21.0, 31.0, 40.0, 87.0, 421.0, 65.0, 52.0, 32.0, 22.0, 12.0, 15.0, 18.0, 20.0, 8.0, 5.0, 9.0, 5.0, 5.0, 3.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1968994140625, -0.1894512176513672, -0.18200302124023438, -0.17455482482910156, -0.16710662841796875, -0.15965843200683594, -0.15221023559570312, -0.1447620391845703, -0.1373138427734375, -0.1298656463623047, -0.12241744995117188, -0.11496925354003906, -0.10752105712890625, -0.10007286071777344, -0.09262466430664062, -0.08517646789550781, -0.077728271484375, -0.07028007507324219, -0.06283187866210938, -0.05538368225097656, -0.04793548583984375, -0.04048728942871094, -0.033039093017578125, -0.025590896606445312, -0.0181427001953125, -0.010694503784179688, -0.003246307373046875, 0.0042018890380859375, 0.01165008544921875, 0.019098281860351562, 0.026546478271484375, 0.03399467468261719, 0.04144287109375, 0.04889106750488281, 0.056339263916015625, 0.06378746032714844, 0.07123565673828125, 0.07868385314941406, 0.08613204956054688, 0.09358024597167969, 0.1010284423828125, 0.10847663879394531, 0.11592483520507812, 0.12337303161621094, 0.13082122802734375, 0.13826942443847656, 0.14571762084960938, 0.1531658172607422, 0.160614013671875, 0.1680622100830078, 0.17551040649414062, 0.18295860290527344, 0.19040679931640625, 0.19785499572753906, 0.20530319213867188, 0.2127513885498047, 0.2201995849609375, 0.2276477813720703, 0.23509597778320312, 0.24254417419433594, 0.24999237060546875, 0.25744056701660156, 0.2648887634277344, 0.2723369598388672, 0.27978515625]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 6.0, 5.0, 8.0, 5.0, 8.0, 7.0, 11.0, 8.0, 12.0, 14.0, 24.0, 28.0, 31.0, 40.0, 40.0, 72.0, 79.0, 90.0, 93.0, 82.0, 69.0, 48.0, 45.0, 30.0, 21.0, 26.0, 9.0, 19.0, 16.0, 8.0, 7.0, 7.0, 7.0, 9.0, 3.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9262692332267761, -0.8952776789665222, -0.8642861843109131, -0.8332946300506592, -0.8023030757904053, -0.7713115811347961, -0.7403200268745422, -0.7093285322189331, -0.6783369779586792, -0.6473454236984253, -0.6163539290428162, -0.5853623747825623, -0.5543708801269531, -0.5233793258666992, -0.4923877716064453, -0.4613962471485138, -0.4304047226905823, -0.39941319823265076, -0.36842167377471924, -0.33743011951446533, -0.3064385950565338, -0.2754470705986023, -0.24445553123950958, -0.21346399188041687, -0.18247246742248535, -0.15148094296455383, -0.12048940360546112, -0.089497871696949, -0.05850633978843689, -0.02751481533050537, 0.0034767240285873413, 0.034468263387680054, 0.06545984745025635, 0.09645137935876846, 0.12744291126728058, 0.1584344506263733, 0.1894259750843048, 0.22041749954223633, 0.25140905380249023, 0.28240057826042175, 0.31339210271835327, 0.3443836271762848, 0.3753751516342163, 0.4063667058944702, 0.43735823035240173, 0.46834975481033325, 0.49934130907058716, 0.5303328037261963, 0.5613243579864502, 0.5923159122467041, 0.6233074069023132, 0.6542989611625671, 0.6852904558181763, 0.7162820100784302, 0.7472735643386841, 0.778265118598938, 0.8092566132545471, 0.840248167514801, 0.8712396621704102, 0.9022312164306641, 0.933222770690918, 0.9642142653465271, 0.995205819606781, 1.0261973142623901, 1.057188868522644]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 3.0, 8.0, 4.0, 9.0, 9.0, 9.0, 7.0, 10.0, 12.0, 13.0, 22.0, 19.0, 26.0, 20.0, 19.0, 25.0, 40.0, 32.0, 32.0, 38.0, 35.0, 46.0, 42.0, 32.0, 43.0, 35.0, 29.0, 40.0, 26.0, 41.0, 34.0, 25.0, 32.0, 19.0, 19.0, 20.0, 13.0, 21.0, 17.0, 15.0, 8.0, 15.0, 7.0, 9.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.887511134147644, -0.8601676225662231, -0.8328241109848022, -0.8054805994033813, -0.7781370878219604, -0.7507935762405396, -0.7234500646591187, -0.6961065530776978, -0.6687630414962769, -0.641419529914856, -0.6140760183334351, -0.5867325067520142, -0.5593889951705933, -0.5320454835891724, -0.5047019720077515, -0.47735849022865295, -0.45001500844955444, -0.42267149686813354, -0.39532798528671265, -0.36798447370529175, -0.34064096212387085, -0.31329745054244995, -0.28595396876335144, -0.25861045718193054, -0.23126694560050964, -0.20392343401908875, -0.17657992243766785, -0.14923642575740814, -0.12189291417598724, -0.09454940259456635, -0.06720590591430664, -0.03986239433288574, -0.012518882751464844, 0.014824625104665756, 0.042168132960796356, 0.06951163709163666, 0.09685514867305756, 0.12419866025447845, 0.15154215693473816, 0.17888566851615906, 0.20622918009757996, 0.23357269167900085, 0.26091620326042175, 0.28825968503952026, 0.31560319662094116, 0.34294670820236206, 0.37029021978378296, 0.39763373136520386, 0.42497724294662476, 0.45232075452804565, 0.47966426610946655, 0.5070077776908875, 0.5343512892723083, 0.5616948008537292, 0.5890382528305054, 0.6163817644119263, 0.6437252759933472, 0.6710687875747681, 0.698412299156189, 0.7257558107376099, 0.7530993223190308, 0.7804428339004517, 0.8077863454818726, 0.8351298570632935, 0.8624733686447144]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 11.0, 9.0, 12.0, 18.0, 27.0, 44.0, 63.0, 109.0, 156.0, 289.0, 356.0, 569.0, 882.0, 1322.0, 2009.0, 3092.0, 4805.0, 7461.0, 11802.0, 18450.0, 30393.0, 51271.0, 92146.0, 184229.0, 493159.0, 1582707.0, 1073382.0, 315077.0, 137764.0, 72823.0, 40756.0, 24537.0, 14991.0, 9658.0, 6322.0, 4311.0, 2812.0, 1912.0, 1374.0, 948.0, 658.0, 483.0, 322.0, 219.0, 156.0, 126.0, 84.0, 62.0, 45.0, 18.0, 19.0, 12.0, 13.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0], "bins": [-1.0546875, -1.0193023681640625, -0.983917236328125, -0.9485321044921875, -0.91314697265625, -0.8777618408203125, -0.842376708984375, -0.8069915771484375, -0.7716064453125, -0.7362213134765625, -0.700836181640625, -0.6654510498046875, -0.63006591796875, -0.5946807861328125, -0.559295654296875, -0.5239105224609375, -0.488525390625, -0.4531402587890625, -0.417755126953125, -0.3823699951171875, -0.34698486328125, -0.3115997314453125, -0.276214599609375, -0.2408294677734375, -0.2054443359375, -0.1700592041015625, -0.134674072265625, -0.0992889404296875, -0.06390380859375, -0.0285186767578125, 0.006866455078125, 0.0422515869140625, 0.07763671875, 0.1130218505859375, 0.148406982421875, 0.1837921142578125, 0.21917724609375, 0.2545623779296875, 0.289947509765625, 0.3253326416015625, 0.3607177734375, 0.3961029052734375, 0.431488037109375, 0.4668731689453125, 0.50225830078125, 0.5376434326171875, 0.573028564453125, 0.6084136962890625, 0.643798828125, 0.6791839599609375, 0.714569091796875, 0.7499542236328125, 0.78533935546875, 0.8207244873046875, 0.856109619140625, 0.8914947509765625, 0.9268798828125, 0.9622650146484375, 0.997650146484375, 1.0330352783203125, 1.06842041015625, 1.1038055419921875, 1.139190673828125, 1.1745758056640625, 1.2099609375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 7.0, 6.0, 12.0, 4.0, 12.0, 12.0, 16.0, 23.0, 21.0, 22.0, 21.0, 30.0, 33.0, 23.0, 29.0, 41.0, 38.0, 43.0, 34.0, 32.0, 39.0, 47.0, 47.0, 32.0, 35.0, 29.0, 31.0, 20.0, 33.0, 29.0, 28.0, 21.0, 18.0, 12.0, 19.0, 14.0, 10.0, 12.0, 12.0, 8.0, 8.0, 4.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.55419921875, -0.5369873046875, -0.519775390625, -0.5025634765625, -0.4853515625, -0.4681396484375, -0.450927734375, -0.4337158203125, -0.41650390625, -0.3992919921875, -0.382080078125, -0.3648681640625, -0.34765625, -0.3304443359375, -0.313232421875, -0.2960205078125, -0.27880859375, -0.2615966796875, -0.244384765625, -0.2271728515625, -0.2099609375, -0.1927490234375, -0.175537109375, -0.1583251953125, -0.14111328125, -0.1239013671875, -0.106689453125, -0.0894775390625, -0.072265625, -0.0550537109375, -0.037841796875, -0.0206298828125, -0.00341796875, 0.0137939453125, 0.031005859375, 0.0482177734375, 0.0654296875, 0.0826416015625, 0.099853515625, 0.1170654296875, 0.13427734375, 0.1514892578125, 0.168701171875, 0.1859130859375, 0.203125, 0.2203369140625, 0.237548828125, 0.2547607421875, 0.27197265625, 0.2891845703125, 0.306396484375, 0.3236083984375, 0.3408203125, 0.3580322265625, 0.375244140625, 0.3924560546875, 0.40966796875, 0.4268798828125, 0.444091796875, 0.4613037109375, 0.478515625, 0.4957275390625, 0.512939453125, 0.5301513671875, 0.54736328125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 17.0, 15.0, 21.0, 28.0, 44.0, 58.0, 95.0, 153.0, 191.0, 296.0, 404.0, 589.0, 824.0, 1213.0, 1775.0, 2615.0, 3854.0, 5936.0, 9130.0, 14156.0, 22049.0, 35749.0, 61134.0, 108412.0, 206001.0, 443696.0, 1179289.0, 1177987.0, 444456.0, 205133.0, 107993.0, 61089.0, 36476.0, 22170.0, 13970.0, 9117.0, 5864.0, 3872.0, 2661.0, 1809.0, 1229.0, 823.0, 575.0, 409.0, 274.0, 196.0, 133.0, 96.0, 58.0, 48.0, 40.0, 27.0, 16.0, 10.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.84765625, -0.8203125, -0.79296875, -0.765625, -0.73828125, -0.7109375, -0.68359375, -0.65625, -0.62890625, -0.6015625, -0.57421875, -0.546875, -0.51953125, -0.4921875, -0.46484375, -0.4375, -0.41015625, -0.3828125, -0.35546875, -0.328125, -0.30078125, -0.2734375, -0.24609375, -0.21875, -0.19140625, -0.1640625, -0.13671875, -0.109375, -0.08203125, -0.0546875, -0.02734375, 0.0, 0.02734375, 0.0546875, 0.08203125, 0.109375, 0.13671875, 0.1640625, 0.19140625, 0.21875, 0.24609375, 0.2734375, 0.30078125, 0.328125, 0.35546875, 0.3828125, 0.41015625, 0.4375, 0.46484375, 0.4921875, 0.51953125, 0.546875, 0.57421875, 0.6015625, 0.62890625, 0.65625, 0.68359375, 0.7109375, 0.73828125, 0.765625, 0.79296875, 0.8203125, 0.84765625, 0.875, 0.90234375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 3.0, 7.0, 18.0, 13.0, 17.0, 26.0, 26.0, 28.0, 43.0, 44.0, 58.0, 78.0, 91.0, 108.0, 138.0, 161.0, 185.0, 175.0, 215.0, 245.0, 285.0, 273.0, 271.0, 246.0, 203.0, 167.0, 159.0, 137.0, 116.0, 80.0, 77.0, 69.0, 67.0, 36.0, 30.0, 34.0, 25.0, 17.0, 20.0, 17.0, 12.0, 9.0, 13.0, 6.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.293701171875, -0.2847023010253906, -0.27570343017578125, -0.2667045593261719, -0.2577056884765625, -0.24870681762695312, -0.23970794677734375, -0.23070907592773438, -0.221710205078125, -0.21271133422851562, -0.20371246337890625, -0.19471359252929688, -0.1857147216796875, -0.17671585083007812, -0.16771697998046875, -0.15871810913085938, -0.14971923828125, -0.14072036743164062, -0.13172149658203125, -0.12272262573242188, -0.1137237548828125, -0.10472488403320312, -0.09572601318359375, -0.08672714233398438, -0.077728271484375, -0.06872940063476562, -0.05973052978515625, -0.050731658935546875, -0.0417327880859375, -0.032733917236328125, -0.02373504638671875, -0.014736175537109375, -0.0057373046875, 0.003261566162109375, 0.01226043701171875, 0.021259307861328125, 0.0302581787109375, 0.039257049560546875, 0.04825592041015625, 0.057254791259765625, 0.066253662109375, 0.07525253295898438, 0.08425140380859375, 0.09325027465820312, 0.1022491455078125, 0.11124801635742188, 0.12024688720703125, 0.12924575805664062, 0.13824462890625, 0.14724349975585938, 0.15624237060546875, 0.16524124145507812, 0.1742401123046875, 0.18323898315429688, 0.19223785400390625, 0.20123672485351562, 0.210235595703125, 0.21923446655273438, 0.22823333740234375, 0.23723220825195312, 0.2462310791015625, 0.2552299499511719, 0.26422882080078125, 0.2732276916503906, 0.2822265625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 5.0, 5.0, 5.0, 6.0, 5.0, 11.0, 10.0, 19.0, 21.0, 31.0, 40.0, 37.0, 44.0, 53.0, 68.0, 85.0, 111.0, 81.0, 68.0, 48.0, 36.0, 40.0, 34.0, 21.0, 27.0, 10.0, 12.0, 11.0, 12.0, 6.0, 2.0, 4.0, 6.0, 8.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7835121750831604, -0.7607682943344116, -0.7380244135856628, -0.7152805328369141, -0.6925366520881653, -0.6697927713394165, -0.6470488905906677, -0.624305009841919, -0.6015611290931702, -0.5788172483444214, -0.5560733675956726, -0.5333294868469238, -0.510585606098175, -0.48784172534942627, -0.4650978446006775, -0.4423539638519287, -0.41961008310317993, -0.39686620235443115, -0.3741223216056824, -0.3513784408569336, -0.3286345601081848, -0.30589067935943604, -0.28314679861068726, -0.2604029178619385, -0.2376590371131897, -0.21491515636444092, -0.19217127561569214, -0.16942739486694336, -0.14668351411819458, -0.1239396333694458, -0.10119575262069702, -0.07845187187194824, -0.05570793151855469, -0.03296405076980591, -0.010220170021057129, 0.01252371072769165, 0.03526759147644043, 0.05801147222518921, 0.08075535297393799, 0.10349923372268677, 0.12624311447143555, 0.14898699522018433, 0.1717308759689331, 0.19447475671768188, 0.21721863746643066, 0.23996251821517944, 0.2627063989639282, 0.285450279712677, 0.3081941604614258, 0.33093804121017456, 0.35368192195892334, 0.3764258027076721, 0.3991696834564209, 0.4219135642051697, 0.44465744495391846, 0.46740132570266724, 0.490145206451416, 0.5128890872001648, 0.5356329679489136, 0.5583768486976624, 0.5811207294464111, 0.6038646101951599, 0.6266084909439087, 0.6493523716926575, 0.6720962524414062]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 7.0, 10.0, 11.0, 7.0, 11.0, 18.0, 21.0, 12.0, 29.0, 21.0, 25.0, 25.0, 39.0, 32.0, 36.0, 55.0, 44.0, 31.0, 34.0, 40.0, 38.0, 46.0, 43.0, 40.0, 34.0, 39.0, 23.0, 22.0, 35.0, 20.0, 28.0, 14.0, 23.0, 12.0, 20.0, 8.0, 11.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6366131901741028, -0.6156259179115295, -0.5946385860443115, -0.5736513137817383, -0.552664041519165, -0.531676709651947, -0.5106894373893738, -0.48970213532447815, -0.4687148332595825, -0.4477275311946869, -0.42674022912979126, -0.405752956867218, -0.3847656548023224, -0.36377835273742676, -0.3427910804748535, -0.3218037784099579, -0.30081647634506226, -0.2798291742801666, -0.258841872215271, -0.23785459995269775, -0.21686729788780212, -0.1958799958229065, -0.17489270865917206, -0.15390542149543762, -0.132918119430542, -0.11193082481622696, -0.09094353020191193, -0.0699562355875969, -0.04896894097328186, -0.027981646358966827, -0.006994351744651794, 0.013992935419082642, 0.034980177879333496, 0.05596747249364853, 0.07695476710796356, 0.0979420617222786, 0.11892935633659363, 0.13991665840148926, 0.1609039455652237, 0.18189123272895813, 0.20287853479385376, 0.2238658368587494, 0.24485312402248383, 0.26584041118621826, 0.2868277132511139, 0.3078150153160095, 0.32880228757858276, 0.3497895896434784, 0.370776891708374, 0.39176419377326965, 0.4127514958381653, 0.4337387681007385, 0.45472607016563416, 0.4757133722305298, 0.496700644493103, 0.5176879167556763, 0.5386752486228943, 0.5596625208854675, 0.5806498527526855, 0.6016371250152588, 0.622624397277832, 0.64361172914505, 0.6645990014076233, 0.6855863332748413, 0.7065736055374146]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 5.0, 4.0, 10.0, 15.0, 23.0, 43.0, 54.0, 72.0, 115.0, 185.0, 254.0, 330.0, 537.0, 797.0, 1171.0, 1640.0, 2429.0, 3574.0, 5250.0, 8194.0, 12535.0, 20067.0, 33239.0, 57338.0, 104550.0, 195282.0, 252716.0, 148715.0, 80009.0, 45009.0, 26812.0, 16438.0, 10547.0, 6721.0, 4484.0, 3121.0, 1956.0, 1420.0, 895.0, 636.0, 432.0, 316.0, 185.0, 112.0, 112.0, 66.0, 44.0, 35.0, 20.0, 21.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.27978515625, -0.27054595947265625, -0.2613067626953125, -0.25206756591796875, -0.242828369140625, -0.23358917236328125, -0.2243499755859375, -0.21511077880859375, -0.20587158203125, -0.19663238525390625, -0.1873931884765625, -0.17815399169921875, -0.168914794921875, -0.15967559814453125, -0.1504364013671875, -0.14119720458984375, -0.1319580078125, -0.12271881103515625, -0.1134796142578125, -0.10424041748046875, -0.095001220703125, -0.08576202392578125, -0.0765228271484375, -0.06728363037109375, -0.05804443359375, -0.04880523681640625, -0.0395660400390625, -0.03032684326171875, -0.021087646484375, -0.01184844970703125, -0.0026092529296875, 0.00662994384765625, 0.015869140625, 0.02510833740234375, 0.0343475341796875, 0.04358673095703125, 0.052825927734375, 0.06206512451171875, 0.0713043212890625, 0.08054351806640625, 0.08978271484375, 0.09902191162109375, 0.1082611083984375, 0.11750030517578125, 0.126739501953125, 0.13597869873046875, 0.1452178955078125, 0.15445709228515625, 0.1636962890625, 0.17293548583984375, 0.1821746826171875, 0.19141387939453125, 0.200653076171875, 0.20989227294921875, 0.2191314697265625, 0.22837066650390625, 0.23760986328125, 0.24684906005859375, 0.2560882568359375, 0.26532745361328125, 0.274566650390625, 0.28380584716796875, 0.2930450439453125, 0.30228424072265625, 0.3115234375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 0.0, 5.0, 8.0, 1.0, 7.0, 8.0, 9.0, 8.0, 11.0, 15.0, 18.0, 19.0, 17.0, 30.0, 21.0, 31.0, 37.0, 36.0, 35.0, 33.0, 49.0, 37.0, 39.0, 38.0, 37.0, 40.0, 51.0, 36.0, 41.0, 35.0, 32.0, 32.0, 29.0, 25.0, 19.0, 18.0, 18.0, 14.0, 16.0, 11.0, 13.0, 7.0, 6.0, 3.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64794921875, -0.6268157958984375, -0.605682373046875, -0.5845489501953125, -0.56341552734375, -0.5422821044921875, -0.521148681640625, -0.5000152587890625, -0.4788818359375, -0.4577484130859375, -0.436614990234375, -0.4154815673828125, -0.39434814453125, -0.3732147216796875, -0.352081298828125, -0.3309478759765625, -0.309814453125, -0.2886810302734375, -0.267547607421875, -0.2464141845703125, -0.22528076171875, -0.2041473388671875, -0.183013916015625, -0.1618804931640625, -0.1407470703125, -0.1196136474609375, -0.098480224609375, -0.0773468017578125, -0.05621337890625, -0.0350799560546875, -0.013946533203125, 0.0071868896484375, 0.0283203125, 0.0494537353515625, 0.070587158203125, 0.0917205810546875, 0.11285400390625, 0.1339874267578125, 0.155120849609375, 0.1762542724609375, 0.1973876953125, 0.2185211181640625, 0.239654541015625, 0.2607879638671875, 0.28192138671875, 0.3030548095703125, 0.324188232421875, 0.3453216552734375, 0.366455078125, 0.3875885009765625, 0.408721923828125, 0.4298553466796875, 0.45098876953125, 0.4721221923828125, 0.493255615234375, 0.5143890380859375, 0.5355224609375, 0.5566558837890625, 0.577789306640625, 0.5989227294921875, 0.62005615234375, 0.6411895751953125, 0.662322998046875, 0.6834564208984375, 0.70458984375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [8.0, 3.0, 9.0, 5.0, 7.0, 23.0, 14.0, 20.0, 45.0, 46.0, 76.0, 78.0, 102.0, 129.0, 216.0, 292.0, 413.0, 576.0, 768.0, 1029.0, 1440.0, 1985.0, 2864.0, 4312.0, 6478.0, 10481.0, 18749.0, 38347.0, 89817.0, 260550.0, 374906.0, 124397.0, 50402.0, 23771.0, 12254.0, 7606.0, 4749.0, 3342.0, 2252.0, 1653.0, 1150.0, 863.0, 664.0, 472.0, 342.0, 233.0, 189.0, 138.0, 91.0, 57.0, 43.0, 29.0, 25.0, 19.0, 17.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0], "bins": [-0.367919921875, -0.3557243347167969, -0.34352874755859375, -0.3313331604003906, -0.3191375732421875, -0.3069419860839844, -0.29474639892578125, -0.2825508117675781, -0.270355224609375, -0.2581596374511719, -0.24596405029296875, -0.23376846313476562, -0.2215728759765625, -0.20937728881835938, -0.19718170166015625, -0.18498611450195312, -0.17279052734375, -0.16059494018554688, -0.14839935302734375, -0.13620376586914062, -0.1240081787109375, -0.11181259155273438, -0.09961700439453125, -0.08742141723632812, -0.075225830078125, -0.06303024291992188, -0.05083465576171875, -0.038639068603515625, -0.0264434814453125, -0.014247894287109375, -0.00205230712890625, 0.010143280029296875, 0.0223388671875, 0.034534454345703125, 0.04673004150390625, 0.058925628662109375, 0.0711212158203125, 0.08331680297851562, 0.09551239013671875, 0.10770797729492188, 0.119903564453125, 0.13209915161132812, 0.14429473876953125, 0.15649032592773438, 0.1686859130859375, 0.18088150024414062, 0.19307708740234375, 0.20527267456054688, 0.21746826171875, 0.22966384887695312, 0.24185943603515625, 0.2540550231933594, 0.2662506103515625, 0.2784461975097656, 0.29064178466796875, 0.3028373718261719, 0.315032958984375, 0.3272285461425781, 0.33942413330078125, 0.3516197204589844, 0.3638153076171875, 0.3760108947753906, 0.38820648193359375, 0.4004020690917969, 0.41259765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 10.0, 12.0, 12.0, 10.0, 18.0, 13.0, 22.0, 31.0, 18.0, 27.0, 26.0, 22.0, 27.0, 29.0, 37.0, 35.0, 43.0, 37.0, 29.0, 29.0, 52.0, 38.0, 24.0, 42.0, 39.0, 31.0, 23.0, 39.0, 18.0, 27.0, 27.0, 20.0, 24.0, 13.0, 12.0, 10.0, 16.0, 12.0, 8.0, 8.0, 3.0, 5.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.35986328125, -0.3481788635253906, -0.33649444580078125, -0.3248100280761719, -0.3131256103515625, -0.3014411926269531, -0.28975677490234375, -0.2780723571777344, -0.266387939453125, -0.2547035217285156, -0.24301910400390625, -0.23133468627929688, -0.2196502685546875, -0.20796585083007812, -0.19628143310546875, -0.18459701538085938, -0.17291259765625, -0.16122817993164062, -0.14954376220703125, -0.13785934448242188, -0.1261749267578125, -0.11449050903320312, -0.10280609130859375, -0.09112167358398438, -0.079437255859375, -0.06775283813476562, -0.05606842041015625, -0.044384002685546875, -0.0326995849609375, -0.021015167236328125, -0.00933074951171875, 0.002353668212890625, 0.0140380859375, 0.025722503662109375, 0.03740692138671875, 0.049091339111328125, 0.0607757568359375, 0.07246017456054688, 0.08414459228515625, 0.09582901000976562, 0.107513427734375, 0.11919784545898438, 0.13088226318359375, 0.14256668090820312, 0.1542510986328125, 0.16593551635742188, 0.17761993408203125, 0.18930435180664062, 0.20098876953125, 0.21267318725585938, 0.22435760498046875, 0.23604202270507812, 0.2477264404296875, 0.2594108581542969, 0.27109527587890625, 0.2827796936035156, 0.294464111328125, 0.3061485290527344, 0.31783294677734375, 0.3295173645019531, 0.3412017822265625, 0.3528861999511719, 0.36457061767578125, 0.3762550354003906, 0.387939453125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 1.0, 5.0, 11.0, 3.0, 19.0, 8.0, 26.0, 29.0, 44.0, 61.0, 86.0, 96.0, 169.0, 209.0, 274.0, 436.0, 479.0, 748.0, 1047.0, 1521.0, 2203.0, 3315.0, 5168.0, 8620.0, 15600.0, 31458.0, 79891.0, 471391.0, 295720.0, 65822.0, 27502.0, 13996.0, 7826.0, 4804.0, 2979.0, 1987.0, 1330.0, 1010.0, 714.0, 507.0, 390.0, 286.0, 213.0, 154.0, 108.0, 77.0, 70.0, 41.0, 36.0, 24.0, 14.0, 7.0, 5.0, 10.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.05657958984375, -0.054911136627197266, -0.05324268341064453, -0.0515742301940918, -0.04990577697753906, -0.04823732376098633, -0.046568870544433594, -0.04490041732788086, -0.043231964111328125, -0.04156351089477539, -0.039895057678222656, -0.03822660446166992, -0.03655815124511719, -0.03488969802856445, -0.03322124481201172, -0.031552791595458984, -0.02988433837890625, -0.028215885162353516, -0.02654743194580078, -0.024878978729248047, -0.023210525512695312, -0.021542072296142578, -0.019873619079589844, -0.01820516586303711, -0.016536712646484375, -0.01486825942993164, -0.013199806213378906, -0.011531352996826172, -0.009862899780273438, -0.008194446563720703, -0.006525993347167969, -0.004857540130615234, -0.0031890869140625, -0.0015206336975097656, 0.00014781951904296875, 0.0018162727355957031, 0.0034847259521484375, 0.005153179168701172, 0.006821632385253906, 0.00849008560180664, 0.010158538818359375, 0.01182699203491211, 0.013495445251464844, 0.015163898468017578, 0.016832351684570312, 0.018500804901123047, 0.02016925811767578, 0.021837711334228516, 0.02350616455078125, 0.025174617767333984, 0.02684307098388672, 0.028511524200439453, 0.030179977416992188, 0.03184843063354492, 0.033516883850097656, 0.03518533706665039, 0.036853790283203125, 0.03852224349975586, 0.040190696716308594, 0.04185914993286133, 0.04352760314941406, 0.0451960563659668, 0.04686450958251953, 0.048532962799072266, 0.050201416015625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 5.0, 4.0, 8.0, 7.0, 13.0, 14.0, 27.0, 29.0, 45.0, 41.0, 76.0, 109.0, 136.0, 161.0, 90.0, 54.0, 34.0, 43.0, 13.0, 24.0, 11.0, 14.0, 8.0, 6.0, 3.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-06, -4.3371692299842834e-06, -4.20399010181427e-06, -4.070810973644257e-06, -3.937631845474243e-06, -3.8044527173042297e-06, -3.6712735891342163e-06, -3.538094460964203e-06, -3.4049153327941895e-06, -3.271736204624176e-06, -3.1385570764541626e-06, -3.005377948284149e-06, -2.8721988201141357e-06, -2.7390196919441223e-06, -2.605840563774109e-06, -2.4726614356040955e-06, -2.339482307434082e-06, -2.2063031792640686e-06, -2.073124051094055e-06, -1.9399449229240417e-06, -1.8067657947540283e-06, -1.6735866665840149e-06, -1.5404075384140015e-06, -1.407228410243988e-06, -1.2740492820739746e-06, -1.1408701539039612e-06, -1.0076910257339478e-06, -8.745118975639343e-07, -7.413327693939209e-07, -6.081536412239075e-07, -4.7497451305389404e-07, -3.417953848838806e-07, -2.086162567138672e-07, -7.543712854385376e-08, 5.774199962615967e-08, 1.909211277961731e-07, 3.241002559661865e-07, 4.5727938413619995e-07, 5.904585123062134e-07, 7.236376404762268e-07, 8.568167686462402e-07, 9.899958968162537e-07, 1.123175024986267e-06, 1.2563541531562805e-06, 1.389533281326294e-06, 1.5227124094963074e-06, 1.6558915376663208e-06, 1.7890706658363342e-06, 1.9222497940063477e-06, 2.055428922176361e-06, 2.1886080503463745e-06, 2.321787178516388e-06, 2.4549663066864014e-06, 2.588145434856415e-06, 2.7213245630264282e-06, 2.8545036911964417e-06, 2.987682819366455e-06, 3.1208619475364685e-06, 3.254041075706482e-06, 3.3872202038764954e-06, 3.520399332046509e-06, 3.6535784602165222e-06, 3.7867575883865356e-06, 3.919936716556549e-06, 4.0531158447265625e-06]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 16.0, 15.0, 18.0, 17.0, 24.0, 46.0, 64.0, 102.0, 142.0, 203.0, 300.0, 426.0, 622.0, 952.0, 1474.0, 2197.0, 3561.0, 5761.0, 10377.0, 19358.0, 41343.0, 104680.0, 417373.0, 282583.0, 82687.0, 34052.0, 16830.0, 9100.0, 5163.0, 3094.0, 1936.0, 1310.0, 890.0, 563.0, 347.0, 295.0, 205.0, 110.0, 94.0, 59.0, 41.0, 39.0, 28.0, 16.0, 10.0, 8.0, 3.0, 6.0, 6.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.05926513671875, -0.05751609802246094, -0.055767059326171875, -0.05401802062988281, -0.05226898193359375, -0.05051994323730469, -0.048770904541015625, -0.04702186584472656, -0.0452728271484375, -0.04352378845214844, -0.041774749755859375, -0.04002571105957031, -0.03827667236328125, -0.03652763366699219, -0.034778594970703125, -0.03302955627441406, -0.031280517578125, -0.029531478881835938, -0.027782440185546875, -0.026033401489257812, -0.02428436279296875, -0.022535324096679688, -0.020786285400390625, -0.019037246704101562, -0.0172882080078125, -0.015539169311523438, -0.013790130615234375, -0.012041091918945312, -0.01029205322265625, -0.008543014526367188, -0.006793975830078125, -0.0050449371337890625, -0.0032958984375, -0.0015468597412109375, 0.000202178955078125, 0.0019512176513671875, 0.00370025634765625, 0.0054492950439453125, 0.007198333740234375, 0.008947372436523438, 0.0106964111328125, 0.012445449829101562, 0.014194488525390625, 0.015943527221679688, 0.01769256591796875, 0.019441604614257812, 0.021190643310546875, 0.022939682006835938, 0.024688720703125, 0.026437759399414062, 0.028186798095703125, 0.029935836791992188, 0.03168487548828125, 0.03343391418457031, 0.035182952880859375, 0.03693199157714844, 0.0386810302734375, 0.04043006896972656, 0.042179107666015625, 0.04392814636230469, 0.04567718505859375, 0.04742622375488281, 0.049175262451171875, 0.05092430114746094, 0.05267333984375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 7.0, 1.0, 7.0, 7.0, 10.0, 15.0, 17.0, 19.0, 28.0, 28.0, 40.0, 51.0, 59.0, 77.0, 119.0, 109.0, 100.0, 57.0, 55.0, 37.0, 21.0, 20.0, 24.0, 18.0, 9.0, 12.0, 9.0, 10.0, 5.0, 7.0, 7.0, 5.0, 4.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0131683349609375, -0.012814044952392578, -0.012459754943847656, -0.012105464935302734, -0.011751174926757812, -0.01139688491821289, -0.011042594909667969, -0.010688304901123047, -0.010334014892578125, -0.009979724884033203, -0.009625434875488281, -0.00927114486694336, -0.008916854858398438, -0.008562564849853516, -0.008208274841308594, -0.007853984832763672, -0.00749969482421875, -0.007145404815673828, -0.006791114807128906, -0.006436824798583984, -0.0060825347900390625, -0.005728244781494141, -0.005373954772949219, -0.005019664764404297, -0.004665374755859375, -0.004311084747314453, -0.003956794738769531, -0.0036025047302246094, -0.0032482147216796875, -0.0028939247131347656, -0.0025396347045898438, -0.002185344696044922, -0.0018310546875, -0.0014767646789550781, -0.0011224746704101562, -0.0007681846618652344, -0.0004138946533203125, -5.9604644775390625e-05, 0.00029468536376953125, 0.0006489753723144531, 0.001003265380859375, 0.0013575553894042969, 0.0017118453979492188, 0.0020661354064941406, 0.0024204254150390625, 0.0027747154235839844, 0.0031290054321289062, 0.003483295440673828, 0.00383758544921875, 0.004191875457763672, 0.004546165466308594, 0.004900455474853516, 0.0052547454833984375, 0.005609035491943359, 0.005963325500488281, 0.006317615509033203, 0.006671905517578125, 0.007026195526123047, 0.007380485534667969, 0.007734775543212891, 0.008089065551757812, 0.008443355560302734, 0.008797645568847656, 0.009151935577392578, 0.0095062255859375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 9.0, 1.0, 4.0, 6.0, 6.0, 6.0, 4.0, 5.0, 10.0, 20.0, 17.0, 31.0, 37.0, 45.0, 37.0, 61.0, 54.0, 87.0, 104.0, 93.0, 71.0, 55.0, 40.0, 40.0, 39.0, 23.0, 17.0, 10.0, 13.0, 16.0, 7.0, 5.0, 4.0, 4.0, 6.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.780517578125, -0.7572737336158752, -0.7340299487113953, -0.7107861042022705, -0.6875423192977905, -0.6642984747886658, -0.641054630279541, -0.617810845375061, -0.5945670008659363, -0.5713231563568115, -0.5480793714523315, -0.5248355269432068, -0.501591682434082, -0.47834789752960205, -0.4551040530204773, -0.4318602383136749, -0.40861642360687256, -0.3853726089000702, -0.3621287941932678, -0.33888494968414307, -0.3156411349773407, -0.29239732027053833, -0.2691534757614136, -0.2459096610546112, -0.22266584634780884, -0.19942203164100647, -0.1761782020330429, -0.15293437242507935, -0.12969055771827698, -0.10644673556089401, -0.08320291340351105, -0.059959083795547485, -0.03671520948410034, -0.013471387326717377, 0.009772434830665588, 0.03301625698804855, 0.05626007914543152, 0.07950390130281448, 0.10274772346019745, 0.125991553068161, 0.14923536777496338, 0.17247918248176575, 0.1957230120897293, 0.21896684169769287, 0.24221065640449524, 0.2654544711112976, 0.28869831562042236, 0.31194213032722473, 0.3351859450340271, 0.35842975974082947, 0.38167357444763184, 0.4049174189567566, 0.42816123366355896, 0.45140504837036133, 0.4746488928794861, 0.49789270758628845, 0.5211365222930908, 0.5443803668022156, 0.5676241517066956, 0.5908679962158203, 0.6141117811203003, 0.637355625629425, 0.6605994701385498, 0.6838432550430298, 0.7070870995521545]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 7.0, 11.0, 10.0, 8.0, 11.0, 17.0, 23.0, 12.0, 27.0, 21.0, 24.0, 31.0, 37.0, 28.0, 39.0, 57.0, 45.0, 29.0, 34.0, 42.0, 36.0, 43.0, 49.0, 36.0, 38.0, 33.0, 24.0, 26.0, 33.0, 18.0, 29.0, 15.0, 20.0, 13.0, 21.0, 7.0, 12.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.626660943031311, -0.6058785915374756, -0.5850962400436401, -0.5643138885498047, -0.5435315370559692, -0.5227491855621338, -0.5019668340682983, -0.4811844229698181, -0.46040207147598267, -0.4396197199821472, -0.41883736848831177, -0.3980550169944763, -0.3772726356983185, -0.35649028420448303, -0.3357079327106476, -0.31492555141448975, -0.2941432297229767, -0.27336087822914124, -0.2525785267353058, -0.23179616034030914, -0.2110137939453125, -0.19023144245147705, -0.1694490909576416, -0.14866672456264496, -0.1278843730688095, -0.10710201412439346, -0.08631965517997742, -0.06553730368614197, -0.04475494474172592, -0.023972585797309875, -0.0031902343034744263, 0.017592132091522217, 0.038374483585357666, 0.05915684252977371, 0.07993920147418976, 0.10072155296802521, 0.12150391191244125, 0.1422862708568573, 0.16306862235069275, 0.1838509887456894, 0.20463334023952484, 0.2254156917333603, 0.24619805812835693, 0.2669804096221924, 0.28776276111602783, 0.3085451126098633, 0.32932746410369873, 0.35010984539985657, 0.370892196893692, 0.39167454838752747, 0.4124568998813629, 0.43323928117752075, 0.4540216326713562, 0.47480398416519165, 0.4955863356590271, 0.5163686871528625, 0.537151038646698, 0.5579333901405334, 0.5787157416343689, 0.5994980931282043, 0.6202804446220398, 0.64106285572052, 0.6618452072143555, 0.6826275587081909, 0.7034099102020264]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 11.0, 11.0, 11.0, 24.0, 40.0, 41.0, 74.0, 108.0, 147.0, 243.0, 350.0, 498.0, 761.0, 1146.0, 1573.0, 2548.0, 3830.0, 5912.0, 9577.0, 15459.0, 25718.0, 45237.0, 85043.0, 172595.0, 289547.0, 182039.0, 88494.0, 46960.0, 26956.0, 15987.0, 9772.0, 6119.0, 3994.0, 2522.0, 1703.0, 1081.0, 745.0, 542.0, 392.0, 217.0, 155.0, 117.0, 71.0, 64.0, 34.0, 24.0, 18.0, 15.0, 10.0, 5.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1552734375, -1.1186370849609375, -1.082000732421875, -1.0453643798828125, -1.00872802734375, -0.9720916748046875, -0.935455322265625, -0.8988189697265625, -0.8621826171875, -0.8255462646484375, -0.788909912109375, -0.7522735595703125, -0.71563720703125, -0.6790008544921875, -0.642364501953125, -0.6057281494140625, -0.569091796875, -0.5324554443359375, -0.495819091796875, -0.4591827392578125, -0.42254638671875, -0.3859100341796875, -0.349273681640625, -0.3126373291015625, -0.2760009765625, -0.2393646240234375, -0.202728271484375, -0.1660919189453125, -0.12945556640625, -0.0928192138671875, -0.056182861328125, -0.0195465087890625, 0.01708984375, 0.0537261962890625, 0.090362548828125, 0.1269989013671875, 0.16363525390625, 0.2002716064453125, 0.236907958984375, 0.2735443115234375, 0.3101806640625, 0.3468170166015625, 0.383453369140625, 0.4200897216796875, 0.45672607421875, 0.4933624267578125, 0.529998779296875, 0.5666351318359375, 0.603271484375, 0.6399078369140625, 0.676544189453125, 0.7131805419921875, 0.74981689453125, 0.7864532470703125, 0.823089599609375, 0.8597259521484375, 0.8963623046875, 0.9329986572265625, 0.969635009765625, 1.0062713623046875, 1.04290771484375, 1.0795440673828125, 1.116180419921875, 1.1528167724609375, 1.189453125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 11.0, 8.0, 8.0, 8.0, 14.0, 17.0, 27.0, 25.0, 27.0, 29.0, 35.0, 29.0, 43.0, 39.0, 53.0, 39.0, 46.0, 41.0, 44.0, 36.0, 45.0, 43.0, 40.0, 28.0, 44.0, 23.0, 23.0, 32.0, 26.0, 16.0, 19.0, 10.0, 22.0, 6.0, 11.0, 10.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6171875, -0.5977249145507812, -0.5782623291015625, -0.5587997436523438, -0.539337158203125, -0.5198745727539062, -0.5004119873046875, -0.48094940185546875, -0.46148681640625, -0.44202423095703125, -0.4225616455078125, -0.40309906005859375, -0.383636474609375, -0.36417388916015625, -0.3447113037109375, -0.32524871826171875, -0.3057861328125, -0.28632354736328125, -0.2668609619140625, -0.24739837646484375, -0.227935791015625, -0.20847320556640625, -0.1890106201171875, -0.16954803466796875, -0.15008544921875, -0.13062286376953125, -0.1111602783203125, -0.09169769287109375, -0.072235107421875, -0.05277252197265625, -0.0333099365234375, -0.01384735107421875, 0.005615234375, 0.02507781982421875, 0.0445404052734375, 0.06400299072265625, 0.083465576171875, 0.10292816162109375, 0.1223907470703125, 0.14185333251953125, 0.16131591796875, 0.18077850341796875, 0.2002410888671875, 0.21970367431640625, 0.239166259765625, 0.25862884521484375, 0.2780914306640625, 0.29755401611328125, 0.3170166015625, 0.33647918701171875, 0.3559417724609375, 0.37540435791015625, 0.394866943359375, 0.41432952880859375, 0.4337921142578125, 0.45325469970703125, 0.47271728515625, 0.49217987060546875, 0.5116424560546875, 0.5311050415039062, 0.550567626953125, 0.5700302124023438, 0.5894927978515625, 0.6089553833007812, 0.62841796875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 12.0, 12.0, 16.0, 26.0, 34.0, 52.0, 65.0, 103.0, 155.0, 233.0, 342.0, 505.0, 772.0, 1176.0, 1712.0, 2769.0, 4288.0, 6886.0, 11268.0, 18474.0, 31551.0, 56660.0, 110211.0, 235039.0, 275276.0, 132577.0, 66495.0, 36708.0, 21065.0, 12620.0, 7640.0, 4908.0, 3084.0, 1930.0, 1334.0, 823.0, 547.0, 368.0, 288.0, 167.0, 123.0, 76.0, 48.0, 36.0, 28.0, 24.0, 8.0, 10.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.11328125, -1.0786285400390625, -1.043975830078125, -1.0093231201171875, -0.97467041015625, -0.9400177001953125, -0.905364990234375, -0.8707122802734375, -0.8360595703125, -0.8014068603515625, -0.766754150390625, -0.7321014404296875, -0.69744873046875, -0.6627960205078125, -0.628143310546875, -0.5934906005859375, -0.558837890625, -0.5241851806640625, -0.489532470703125, -0.4548797607421875, -0.42022705078125, -0.3855743408203125, -0.350921630859375, -0.3162689208984375, -0.2816162109375, -0.2469635009765625, -0.212310791015625, -0.1776580810546875, -0.14300537109375, -0.1083526611328125, -0.073699951171875, -0.0390472412109375, -0.00439453125, 0.0302581787109375, 0.064910888671875, 0.0995635986328125, 0.13421630859375, 0.1688690185546875, 0.203521728515625, 0.2381744384765625, 0.2728271484375, 0.3074798583984375, 0.342132568359375, 0.3767852783203125, 0.41143798828125, 0.4460906982421875, 0.480743408203125, 0.5153961181640625, 0.550048828125, 0.5847015380859375, 0.619354248046875, 0.6540069580078125, 0.68865966796875, 0.7233123779296875, 0.757965087890625, 0.7926177978515625, 0.8272705078125, 0.8619232177734375, 0.896575927734375, 0.9312286376953125, 0.96588134765625, 1.0005340576171875, 1.035186767578125, 1.0698394775390625, 1.1044921875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 12.0, 8.0, 7.0, 19.0, 17.0, 13.0, 22.0, 18.0, 17.0, 35.0, 30.0, 29.0, 31.0, 44.0, 33.0, 39.0, 41.0, 39.0, 39.0, 42.0, 47.0, 41.0, 34.0, 40.0, 39.0, 40.0, 25.0, 30.0, 32.0, 19.0, 22.0, 14.0, 17.0, 11.0, 8.0, 9.0, 8.0, 10.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.403076171875, -0.3914451599121094, -0.37981414794921875, -0.3681831359863281, -0.3565521240234375, -0.3449211120605469, -0.33329010009765625, -0.3216590881347656, -0.310028076171875, -0.2983970642089844, -0.28676605224609375, -0.2751350402832031, -0.2635040283203125, -0.2518730163574219, -0.24024200439453125, -0.22861099243164062, -0.21697998046875, -0.20534896850585938, -0.19371795654296875, -0.18208694458007812, -0.1704559326171875, -0.15882492065429688, -0.14719390869140625, -0.13556289672851562, -0.123931884765625, -0.11230087280273438, -0.10066986083984375, -0.08903884887695312, -0.0774078369140625, -0.06577682495117188, -0.05414581298828125, -0.042514801025390625, -0.0308837890625, -0.019252777099609375, -0.00762176513671875, 0.004009246826171875, 0.0156402587890625, 0.027271270751953125, 0.03890228271484375, 0.050533294677734375, 0.062164306640625, 0.07379531860351562, 0.08542633056640625, 0.09705734252929688, 0.1086883544921875, 0.12031936645507812, 0.13195037841796875, 0.14358139038085938, 0.15521240234375, 0.16684341430664062, 0.17847442626953125, 0.19010543823242188, 0.2017364501953125, 0.21336746215820312, 0.22499847412109375, 0.23662948608398438, 0.248260498046875, 0.2598915100097656, 0.27152252197265625, 0.2831535339355469, 0.2947845458984375, 0.3064155578613281, 0.31804656982421875, 0.3296775817871094, 0.34130859375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 9.0, 17.0, 37.0, 47.0, 72.0, 96.0, 134.0, 184.0, 247.0, 315.0, 481.0, 526.0, 851.0, 1030.0, 1565.0, 2219.0, 3186.0, 4454.0, 6458.0, 9561.0, 14461.0, 24553.0, 50761.0, 758958.0, 82336.0, 31776.0, 17800.0, 11148.0, 7518.0, 5151.0, 3589.0, 2558.0, 1768.0, 1319.0, 863.0, 665.0, 461.0, 353.0, 284.0, 197.0, 156.0, 120.0, 77.0, 46.0, 52.0, 28.0, 18.0, 18.0, 9.0, 7.0, 2.0, 4.0, 2.0, 2.0], "bins": [-0.8076171875, -0.7836532592773438, -0.7596893310546875, -0.7357254028320312, -0.711761474609375, -0.6877975463867188, -0.6638336181640625, -0.6398696899414062, -0.61590576171875, -0.5919418334960938, -0.5679779052734375, -0.5440139770507812, -0.520050048828125, -0.49608612060546875, -0.4721221923828125, -0.44815826416015625, -0.4241943359375, -0.40023040771484375, -0.3762664794921875, -0.35230255126953125, -0.328338623046875, -0.30437469482421875, -0.2804107666015625, -0.25644683837890625, -0.23248291015625, -0.20851898193359375, -0.1845550537109375, -0.16059112548828125, -0.136627197265625, -0.11266326904296875, -0.0886993408203125, -0.06473541259765625, -0.040771484375, -0.01680755615234375, 0.0071563720703125, 0.03112030029296875, 0.055084228515625, 0.07904815673828125, 0.1030120849609375, 0.12697601318359375, 0.15093994140625, 0.17490386962890625, 0.1988677978515625, 0.22283172607421875, 0.246795654296875, 0.27075958251953125, 0.2947235107421875, 0.31868743896484375, 0.3426513671875, 0.36661529541015625, 0.3905792236328125, 0.41454315185546875, 0.438507080078125, 0.46247100830078125, 0.4864349365234375, 0.5103988647460938, 0.53436279296875, 0.5583267211914062, 0.5822906494140625, 0.6062545776367188, 0.630218505859375, 0.6541824340820312, 0.6781463623046875, 0.7021102905273438, 0.72607421875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 5.0, 7.0, 12.0, 5.0, 12.0, 19.0, 31.0, 64.0, 475.0, 199.0, 50.0, 23.0, 20.0, 9.0, 6.0, 11.0, 6.0, 2.0, 4.0, 2.0, 6.0, 4.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.267692565917969e-05, -4.1484832763671875e-05, -4.029273986816406e-05, -3.910064697265625e-05, -3.790855407714844e-05, -3.6716461181640625e-05, -3.552436828613281e-05, -3.4332275390625e-05, -3.314018249511719e-05, -3.1948089599609375e-05, -3.075599670410156e-05, -2.956390380859375e-05, -2.8371810913085938e-05, -2.7179718017578125e-05, -2.5987625122070312e-05, -2.47955322265625e-05, -2.3603439331054688e-05, -2.2411346435546875e-05, -2.1219253540039062e-05, -2.002716064453125e-05, -1.8835067749023438e-05, -1.7642974853515625e-05, -1.6450881958007812e-05, -1.52587890625e-05, -1.4066696166992188e-05, -1.2874603271484375e-05, -1.1682510375976562e-05, -1.049041748046875e-05, -9.298324584960938e-06, -8.106231689453125e-06, -6.9141387939453125e-06, -5.7220458984375e-06, -4.5299530029296875e-06, -3.337860107421875e-06, -2.1457672119140625e-06, -9.5367431640625e-07, 2.384185791015625e-07, 1.430511474609375e-06, 2.6226043701171875e-06, 3.814697265625e-06, 5.0067901611328125e-06, 6.198883056640625e-06, 7.3909759521484375e-06, 8.58306884765625e-06, 9.775161743164062e-06, 1.0967254638671875e-05, 1.2159347534179688e-05, 1.33514404296875e-05, 1.4543533325195312e-05, 1.5735626220703125e-05, 1.6927719116210938e-05, 1.811981201171875e-05, 1.9311904907226562e-05, 2.0503997802734375e-05, 2.1696090698242188e-05, 2.288818359375e-05, 2.4080276489257812e-05, 2.5272369384765625e-05, 2.6464462280273438e-05, 2.765655517578125e-05, 2.8848648071289062e-05, 3.0040740966796875e-05, 3.123283386230469e-05, 3.24249267578125e-05, 3.361701965332031e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 11.0, 12.0, 18.0, 26.0, 39.0, 65.0, 62.0, 112.0, 145.0, 205.0, 309.0, 420.0, 646.0, 896.0, 1383.0, 2009.0, 2892.0, 4557.0, 7080.0, 11320.0, 19482.0, 35999.0, 91783.0, 749304.0, 52614.0, 26342.0, 14845.0, 8955.0, 5725.0, 3640.0, 2399.0, 1617.0, 1143.0, 776.0, 501.0, 385.0, 253.0, 162.0, 136.0, 72.0, 65.0, 39.0, 33.0, 25.0, 18.0, 5.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.86962890625, -0.8418045043945312, -0.8139801025390625, -0.7861557006835938, -0.758331298828125, -0.7305068969726562, -0.7026824951171875, -0.6748580932617188, -0.64703369140625, -0.6192092895507812, -0.5913848876953125, -0.5635604858398438, -0.535736083984375, -0.5079116821289062, -0.4800872802734375, -0.45226287841796875, -0.4244384765625, -0.39661407470703125, -0.3687896728515625, -0.34096527099609375, -0.313140869140625, -0.28531646728515625, -0.2574920654296875, -0.22966766357421875, -0.20184326171875, -0.17401885986328125, -0.1461944580078125, -0.11837005615234375, -0.090545654296875, -0.06272125244140625, -0.0348968505859375, -0.00707244873046875, 0.020751953125, 0.04857635498046875, 0.0764007568359375, 0.10422515869140625, 0.132049560546875, 0.15987396240234375, 0.1876983642578125, 0.21552276611328125, 0.24334716796875, 0.27117156982421875, 0.2989959716796875, 0.32682037353515625, 0.354644775390625, 0.38246917724609375, 0.4102935791015625, 0.43811798095703125, 0.4659423828125, 0.49376678466796875, 0.5215911865234375, 0.5494155883789062, 0.577239990234375, 0.6050643920898438, 0.6328887939453125, 0.6607131958007812, 0.68853759765625, 0.7163619995117188, 0.7441864013671875, 0.7720108032226562, 0.799835205078125, 0.8276596069335938, 0.8554840087890625, 0.8833084106445312, 0.9111328125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 9.0, 2.0, 9.0, 1.0, 6.0, 5.0, 10.0, 12.0, 12.0, 12.0, 16.0, 17.0, 19.0, 24.0, 471.0, 151.0, 36.0, 21.0, 22.0, 21.0, 15.0, 14.0, 14.0, 17.0, 9.0, 5.0, 6.0, 10.0, 3.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24688339233398438, -0.23863983154296875, -0.23039627075195312, -0.2221527099609375, -0.21390914916992188, -0.20566558837890625, -0.19742202758789062, -0.189178466796875, -0.18093490600585938, -0.17269134521484375, -0.16444778442382812, -0.1562042236328125, -0.14796066284179688, -0.13971710205078125, -0.13147354125976562, -0.12322998046875, -0.11498641967773438, -0.10674285888671875, -0.09849929809570312, -0.0902557373046875, -0.08201217651367188, -0.07376861572265625, -0.06552505493164062, -0.057281494140625, -0.049037933349609375, -0.04079437255859375, -0.032550811767578125, -0.0243072509765625, -0.016063690185546875, -0.00782012939453125, 0.000423431396484375, 0.0086669921875, 0.016910552978515625, 0.02515411376953125, 0.033397674560546875, 0.0416412353515625, 0.049884796142578125, 0.05812835693359375, 0.06637191772460938, 0.074615478515625, 0.08285903930664062, 0.09110260009765625, 0.09934616088867188, 0.1075897216796875, 0.11583328247070312, 0.12407684326171875, 0.13232040405273438, 0.14056396484375, 0.14880752563476562, 0.15705108642578125, 0.16529464721679688, 0.1735382080078125, 0.18178176879882812, 0.19002532958984375, 0.19826889038085938, 0.206512451171875, 0.21475601196289062, 0.22299957275390625, 0.23124313354492188, 0.2394866943359375, 0.24773025512695312, 0.25597381591796875, 0.2642173767089844, 0.2724609375]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 5.0, 3.0, 6.0, 6.0, 9.0, 10.0, 10.0, 20.0, 17.0, 24.0, 35.0, 37.0, 50.0, 59.0, 81.0, 83.0, 106.0, 81.0, 67.0, 51.0, 45.0, 31.0, 25.0, 22.0, 15.0, 15.0, 17.0, 13.0, 11.0, 8.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6937131285667419, -0.6714305877685547, -0.6491481065750122, -0.6268656253814697, -0.6045830845832825, -0.5823005437850952, -0.5600180625915527, -0.5377355813980103, -0.515453040599823, -0.49317052960395813, -0.47088801860809326, -0.4486055076122284, -0.4263229966163635, -0.40404048562049866, -0.3817579746246338, -0.3594754636287689, -0.33719295263290405, -0.3149104416370392, -0.2926279306411743, -0.27034541964530945, -0.24806290864944458, -0.2257803976535797, -0.20349788665771484, -0.18121537566184998, -0.1589328646659851, -0.13665035367012024, -0.11436784267425537, -0.0920853316783905, -0.06980282068252563, -0.04752030968666077, -0.0252377986907959, -0.0029552876949310303, 0.019327282905578613, 0.04160979390144348, 0.06389230489730835, 0.08617481589317322, 0.10845732688903809, 0.13073983788490295, 0.15302234888076782, 0.1753048598766327, 0.19758737087249756, 0.21986988186836243, 0.2421523928642273, 0.26443490386009216, 0.28671741485595703, 0.3089999258518219, 0.33128243684768677, 0.35356494784355164, 0.3758474588394165, 0.39812996983528137, 0.42041248083114624, 0.4426949918270111, 0.464977502822876, 0.48726001381874084, 0.5095425248146057, 0.531825065612793, 0.5541075468063354, 0.5763900279998779, 0.5986725687980652, 0.6209551095962524, 0.6432375907897949, 0.6655200719833374, 0.6878026127815247, 0.7100851535797119, 0.7323676347732544]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 4.0, 7.0, 13.0, 14.0, 17.0, 10.0, 19.0, 28.0, 25.0, 28.0, 32.0, 42.0, 33.0, 38.0, 31.0, 31.0, 48.0, 34.0, 44.0, 41.0, 35.0, 52.0, 42.0, 40.0, 35.0, 38.0, 35.0, 21.0, 25.0, 20.0, 15.0, 27.0, 11.0, 15.0, 10.0, 8.0, 9.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6757290959358215, -0.6555466651916504, -0.635364294052124, -0.6151818633079529, -0.5949994325637817, -0.5748170018196106, -0.5546345710754395, -0.5344521999359131, -0.5142697691917419, -0.4940873384475708, -0.47390493750572205, -0.4537225365638733, -0.43354010581970215, -0.413357675075531, -0.39317527413368225, -0.3729928731918335, -0.35281044244766235, -0.3326280117034912, -0.31244561076164246, -0.2922632098197937, -0.27208077907562256, -0.2518983483314514, -0.23171594738960266, -0.2115335315465927, -0.19135111570358276, -0.17116869986057281, -0.15098628401756287, -0.13080386817455292, -0.11062145233154297, -0.09043903648853302, -0.07025662064552307, -0.05007420480251312, -0.029891788959503174, -0.009709373116493225, 0.010473042726516724, 0.030655458569526672, 0.05083787441253662, 0.07102029025554657, 0.09120270609855652, 0.11138512194156647, 0.13156753778457642, 0.15174995362758636, 0.1719323694705963, 0.19211478531360626, 0.2122972011566162, 0.23247961699962616, 0.2526620328426361, 0.27284443378448486, 0.293026864528656, 0.31320929527282715, 0.3333916962146759, 0.35357409715652466, 0.3737565279006958, 0.39393895864486694, 0.4141213595867157, 0.43430376052856445, 0.4544861912727356, 0.47466862201690674, 0.4948510229587555, 0.5150334239006042, 0.5352158546447754, 0.5553982853889465, 0.5755807161331177, 0.595763087272644, 0.6159455180168152]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 6.0, 12.0, 22.0, 32.0, 35.0, 69.0, 84.0, 110.0, 153.0, 231.0, 292.0, 445.0, 632.0, 887.0, 1329.0, 1846.0, 2679.0, 3877.0, 5826.0, 8438.0, 12503.0, 19282.0, 29933.0, 47738.0, 78917.0, 140210.0, 279689.0, 771839.0, 1511339.0, 680896.0, 256538.0, 132054.0, 75259.0, 45803.0, 28472.0, 17959.0, 12200.0, 8368.0, 5601.0, 3725.0, 2618.0, 1863.0, 1343.0, 925.0, 653.0, 466.0, 303.0, 215.0, 167.0, 111.0, 97.0, 61.0, 45.0, 27.0, 29.0, 21.0, 11.0, 4.0, 0.0, 3.0, 4.0], "bins": [-0.634765625, -0.6145782470703125, -0.594390869140625, -0.5742034912109375, -0.55401611328125, -0.5338287353515625, -0.513641357421875, -0.4934539794921875, -0.4732666015625, -0.4530792236328125, -0.432891845703125, -0.4127044677734375, -0.39251708984375, -0.3723297119140625, -0.352142333984375, -0.3319549560546875, -0.311767578125, -0.2915802001953125, -0.271392822265625, -0.2512054443359375, -0.23101806640625, -0.2108306884765625, -0.190643310546875, -0.1704559326171875, -0.1502685546875, -0.1300811767578125, -0.109893798828125, -0.0897064208984375, -0.06951904296875, -0.0493316650390625, -0.029144287109375, -0.0089569091796875, 0.01123046875, 0.0314178466796875, 0.051605224609375, 0.0717926025390625, 0.09197998046875, 0.1121673583984375, 0.132354736328125, 0.1525421142578125, 0.1727294921875, 0.1929168701171875, 0.213104248046875, 0.2332916259765625, 0.25347900390625, 0.2736663818359375, 0.293853759765625, 0.3140411376953125, 0.334228515625, 0.3544158935546875, 0.374603271484375, 0.3947906494140625, 0.41497802734375, 0.4351654052734375, 0.455352783203125, 0.4755401611328125, 0.4957275390625, 0.5159149169921875, 0.536102294921875, 0.5562896728515625, 0.57647705078125, 0.5966644287109375, 0.616851806640625, 0.6370391845703125, 0.6572265625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 11.0, 17.0, 9.0, 13.0, 16.0, 26.0, 22.0, 24.0, 36.0, 30.0, 39.0, 36.0, 42.0, 41.0, 43.0, 56.0, 48.0, 50.0, 30.0, 50.0, 39.0, 42.0, 42.0, 38.0, 26.0, 29.0, 26.0, 16.0, 13.0, 17.0, 14.0, 14.0, 11.0, 9.0, 8.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432861328125, -0.4195213317871094, -0.40618133544921875, -0.3928413391113281, -0.3795013427734375, -0.3661613464355469, -0.35282135009765625, -0.3394813537597656, -0.326141357421875, -0.3128013610839844, -0.29946136474609375, -0.2861213684082031, -0.2727813720703125, -0.2594413757324219, -0.24610137939453125, -0.23276138305664062, -0.21942138671875, -0.20608139038085938, -0.19274139404296875, -0.17940139770507812, -0.1660614013671875, -0.15272140502929688, -0.13938140869140625, -0.12604141235351562, -0.112701416015625, -0.09936141967773438, -0.08602142333984375, -0.07268142700195312, -0.0593414306640625, -0.046001434326171875, -0.03266143798828125, -0.019321441650390625, -0.0059814453125, 0.007358551025390625, 0.02069854736328125, 0.034038543701171875, 0.0473785400390625, 0.060718536376953125, 0.07405853271484375, 0.08739852905273438, 0.100738525390625, 0.11407852172851562, 0.12741851806640625, 0.14075851440429688, 0.1540985107421875, 0.16743850708007812, 0.18077850341796875, 0.19411849975585938, 0.20745849609375, 0.22079849243164062, 0.23413848876953125, 0.24747848510742188, 0.2608184814453125, 0.2741584777832031, 0.28749847412109375, 0.3008384704589844, 0.314178466796875, 0.3275184631347656, 0.34085845947265625, 0.3541984558105469, 0.3675384521484375, 0.3808784484863281, 0.39421844482421875, 0.4075584411621094, 0.4208984375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 11.0, 11.0, 23.0, 38.0, 49.0, 70.0, 136.0, 154.0, 278.0, 428.0, 630.0, 959.0, 1474.0, 2345.0, 3724.0, 5747.0, 9348.0, 15266.0, 25316.0, 42642.0, 75437.0, 139761.0, 282504.0, 675304.0, 1530354.0, 738342.0, 302161.0, 148462.0, 79443.0, 45082.0, 26431.0, 15763.0, 9742.0, 6141.0, 3842.0, 2391.0, 1617.0, 977.0, 679.0, 427.0, 288.0, 166.0, 117.0, 73.0, 52.0, 28.0, 17.0, 13.0, 12.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.62451171875, -0.6047134399414062, -0.5849151611328125, -0.5651168823242188, -0.545318603515625, -0.5255203247070312, -0.5057220458984375, -0.48592376708984375, -0.46612548828125, -0.44632720947265625, -0.4265289306640625, -0.40673065185546875, -0.386932373046875, -0.36713409423828125, -0.3473358154296875, -0.32753753662109375, -0.3077392578125, -0.28794097900390625, -0.2681427001953125, -0.24834442138671875, -0.228546142578125, -0.20874786376953125, -0.1889495849609375, -0.16915130615234375, -0.14935302734375, -0.12955474853515625, -0.1097564697265625, -0.08995819091796875, -0.070159912109375, -0.05036163330078125, -0.0305633544921875, -0.01076507568359375, 0.009033203125, 0.02883148193359375, 0.0486297607421875, 0.06842803955078125, 0.088226318359375, 0.10802459716796875, 0.1278228759765625, 0.14762115478515625, 0.16741943359375, 0.18721771240234375, 0.2070159912109375, 0.22681427001953125, 0.246612548828125, 0.26641082763671875, 0.2862091064453125, 0.30600738525390625, 0.3258056640625, 0.34560394287109375, 0.3654022216796875, 0.38520050048828125, 0.404998779296875, 0.42479705810546875, 0.4445953369140625, 0.46439361572265625, 0.48419189453125, 0.5039901733398438, 0.5237884521484375, 0.5435867309570312, 0.563385009765625, 0.5831832885742188, 0.6029815673828125, 0.6227798461914062, 0.642578125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 9.0, 7.0, 8.0, 4.0, 19.0, 19.0, 22.0, 43.0, 35.0, 50.0, 57.0, 73.0, 79.0, 92.0, 112.0, 139.0, 178.0, 207.0, 203.0, 233.0, 233.0, 261.0, 278.0, 234.0, 232.0, 203.0, 162.0, 155.0, 121.0, 99.0, 100.0, 80.0, 63.0, 60.0, 50.0, 34.0, 22.0, 26.0, 12.0, 12.0, 8.0, 8.0, 8.0, 8.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.205810546875, -0.19975662231445312, -0.19370269775390625, -0.18764877319335938, -0.1815948486328125, -0.17554092407226562, -0.16948699951171875, -0.16343307495117188, -0.157379150390625, -0.15132522583007812, -0.14527130126953125, -0.13921737670898438, -0.1331634521484375, -0.12710952758789062, -0.12105560302734375, -0.11500167846679688, -0.10894775390625, -0.10289382934570312, -0.09683990478515625, -0.09078598022460938, -0.0847320556640625, -0.07867813110351562, -0.07262420654296875, -0.06657028198242188, -0.060516357421875, -0.054462432861328125, -0.04840850830078125, -0.042354583740234375, -0.0363006591796875, -0.030246734619140625, -0.02419281005859375, -0.018138885498046875, -0.0120849609375, -0.006031036376953125, 2.288818359375e-05, 0.006076812744140625, 0.0121307373046875, 0.018184661865234375, 0.02423858642578125, 0.030292510986328125, 0.036346435546875, 0.042400360107421875, 0.04845428466796875, 0.054508209228515625, 0.0605621337890625, 0.06661605834960938, 0.07266998291015625, 0.07872390747070312, 0.08477783203125, 0.09083175659179688, 0.09688568115234375, 0.10293960571289062, 0.1089935302734375, 0.11504745483398438, 0.12110137939453125, 0.12715530395507812, 0.133209228515625, 0.13926315307617188, 0.14531707763671875, 0.15137100219726562, 0.1574249267578125, 0.16347885131835938, 0.16953277587890625, 0.17558670043945312, 0.181640625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 0.0, 5.0, 7.0, 5.0, 7.0, 11.0, 15.0, 8.0, 11.0, 25.0, 21.0, 39.0, 34.0, 48.0, 52.0, 72.0, 105.0, 85.0, 89.0, 75.0, 69.0, 40.0, 31.0, 31.0, 26.0, 16.0, 10.0, 17.0, 11.0, 6.0, 6.0, 7.0, 2.0, 7.0, 0.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6363847851753235, -0.6188454627990723, -0.6013062000274658, -0.5837668776512146, -0.5662275552749634, -0.5486882925033569, -0.5311489701271057, -0.5136096477508545, -0.49607035517692566, -0.4785310626029968, -0.4609917402267456, -0.4434524476528168, -0.42591315507888794, -0.4083738327026367, -0.3908345401287079, -0.37329524755477905, -0.35575592517852783, -0.338216632604599, -0.3206773102283478, -0.30313801765441895, -0.2855986952781677, -0.2680594027042389, -0.25052011013031006, -0.23298080265522003, -0.21544149518013, -0.19790218770503998, -0.18036288022994995, -0.16282358765602112, -0.1452842801809311, -0.12774497270584106, -0.11020567268133163, -0.0926663726568222, -0.0751270055770874, -0.057587701827287674, -0.040048398077487946, -0.022509094327688217, -0.004969790577888489, 0.012569516897201538, 0.030108816921710968, 0.0476481169462204, 0.06518742442131042, 0.08272673189640045, 0.10026603192090988, 0.11780533194541931, 0.13534463942050934, 0.15288394689559937, 0.1704232394695282, 0.18796254694461823, 0.20550185441970825, 0.22304116189479828, 0.2405804693698883, 0.25811976194381714, 0.27565908432006836, 0.2931983768939972, 0.310737669467926, 0.32827699184417725, 0.3458162844181061, 0.3633555769920349, 0.38089489936828613, 0.39843419194221497, 0.4159734845161438, 0.433512806892395, 0.45105209946632385, 0.4685913920402527, 0.4861307144165039]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 4.0, 5.0, 8.0, 4.0, 13.0, 12.0, 16.0, 15.0, 21.0, 23.0, 34.0, 24.0, 36.0, 40.0, 43.0, 36.0, 28.0, 42.0, 42.0, 36.0, 37.0, 38.0, 45.0, 39.0, 35.0, 40.0, 35.0, 40.0, 28.0, 23.0, 30.0, 16.0, 20.0, 18.0, 18.0, 17.0, 4.0, 5.0, 9.0, 10.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5176392793655396, -0.5034703016281128, -0.48930129408836365, -0.4751323163509369, -0.46096333861351013, -0.446794331073761, -0.43262535333633423, -0.41845637559890747, -0.4042873978614807, -0.39011842012405396, -0.3759494125843048, -0.36178043484687805, -0.3476114571094513, -0.33344244956970215, -0.3192734718322754, -0.30510449409484863, -0.2909354865550995, -0.27676650881767273, -0.2625975012779236, -0.24842852354049683, -0.23425954580307007, -0.22009055316448212, -0.20592156052589417, -0.1917525827884674, -0.17758359014987946, -0.1634145975112915, -0.14924561977386475, -0.1350766271352768, -0.12090764194726944, -0.10673865675926208, -0.09256966412067413, -0.07840067893266678, -0.06423172354698181, -0.05006273835897446, -0.035893749445676804, -0.02172476053237915, -0.007555775344371796, 0.006613209843635559, 0.02078220248222351, 0.034951187670230865, 0.04912017285823822, 0.06328915804624557, 0.07745814323425293, 0.09162713587284088, 0.10579612106084824, 0.11996510624885559, 0.13413409888744354, 0.1483030915260315, 0.16247206926345825, 0.1766410619020462, 0.19081003963947296, 0.2049790322780609, 0.21914801001548767, 0.23331700265407562, 0.24748599529266357, 0.26165497303009033, 0.2758239507675171, 0.28999292850494385, 0.304161936044693, 0.31833091378211975, 0.3324998915195465, 0.34666889905929565, 0.3608378767967224, 0.37500685453414917, 0.3891758620738983]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 7.0, 6.0, 8.0, 11.0, 16.0, 18.0, 36.0, 47.0, 64.0, 111.0, 154.0, 207.0, 296.0, 436.0, 584.0, 846.0, 1186.0, 1595.0, 2448.0, 3612.0, 5287.0, 7833.0, 11715.0, 18211.0, 28921.0, 46448.0, 79760.0, 140043.0, 234061.0, 189258.0, 107654.0, 61701.0, 37434.0, 23200.0, 14758.0, 9813.0, 6566.0, 4401.0, 2912.0, 2039.0, 1452.0, 1054.0, 681.0, 471.0, 369.0, 247.0, 191.0, 128.0, 87.0, 64.0, 36.0, 29.0, 18.0, 13.0, 9.0, 3.0, 7.0, 2.0, 2.0, 4.0], "bins": [-0.1925048828125, -0.1866302490234375, -0.180755615234375, -0.1748809814453125, -0.16900634765625, -0.1631317138671875, -0.157257080078125, -0.1513824462890625, -0.1455078125, -0.1396331787109375, -0.133758544921875, -0.1278839111328125, -0.12200927734375, -0.1161346435546875, -0.110260009765625, -0.1043853759765625, -0.0985107421875, -0.0926361083984375, -0.086761474609375, -0.0808868408203125, -0.07501220703125, -0.0691375732421875, -0.063262939453125, -0.0573883056640625, -0.051513671875, -0.0456390380859375, -0.039764404296875, -0.0338897705078125, -0.02801513671875, -0.0221405029296875, -0.016265869140625, -0.0103912353515625, -0.0045166015625, 0.0013580322265625, 0.007232666015625, 0.0131072998046875, 0.01898193359375, 0.0248565673828125, 0.030731201171875, 0.0366058349609375, 0.04248046875, 0.0483551025390625, 0.054229736328125, 0.0601043701171875, 0.06597900390625, 0.0718536376953125, 0.077728271484375, 0.0836029052734375, 0.0894775390625, 0.0953521728515625, 0.101226806640625, 0.1071014404296875, 0.11297607421875, 0.1188507080078125, 0.124725341796875, 0.1305999755859375, 0.136474609375, 0.1423492431640625, 0.148223876953125, 0.1540985107421875, 0.15997314453125, 0.1658477783203125, 0.171722412109375, 0.1775970458984375, 0.1834716796875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 2.0, 7.0, 7.0, 13.0, 8.0, 12.0, 21.0, 12.0, 24.0, 39.0, 29.0, 26.0, 43.0, 45.0, 37.0, 37.0, 40.0, 42.0, 28.0, 51.0, 41.0, 44.0, 38.0, 57.0, 23.0, 36.0, 27.0, 37.0, 22.0, 25.0, 16.0, 24.0, 22.0, 11.0, 13.0, 10.0, 5.0, 9.0, 10.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5057258605957031, -0.49094390869140625, -0.4761619567871094, -0.4613800048828125, -0.4465980529785156, -0.43181610107421875, -0.4170341491699219, -0.402252197265625, -0.3874702453613281, -0.37268829345703125, -0.3579063415527344, -0.3431243896484375, -0.3283424377441406, -0.31356048583984375, -0.2987785339355469, -0.28399658203125, -0.2692146301269531, -0.25443267822265625, -0.23965072631835938, -0.2248687744140625, -0.21008682250976562, -0.19530487060546875, -0.18052291870117188, -0.165740966796875, -0.15095901489257812, -0.13617706298828125, -0.12139511108398438, -0.1066131591796875, -0.09183120727539062, -0.07704925537109375, -0.062267303466796875, -0.0474853515625, -0.032703399658203125, -0.01792144775390625, -0.003139495849609375, 0.0116424560546875, 0.026424407958984375, 0.04120635986328125, 0.055988311767578125, 0.070770263671875, 0.08555221557617188, 0.10033416748046875, 0.11511611938476562, 0.1298980712890625, 0.14468002319335938, 0.15946197509765625, 0.17424392700195312, 0.18902587890625, 0.20380783081054688, 0.21858978271484375, 0.23337173461914062, 0.2481536865234375, 0.2629356384277344, 0.27771759033203125, 0.2924995422363281, 0.307281494140625, 0.3220634460449219, 0.33684539794921875, 0.3516273498535156, 0.3664093017578125, 0.3811912536621094, 0.39597320556640625, 0.4107551574707031, 0.425537109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 0.0, 6.0, 8.0, 8.0, 9.0, 9.0, 12.0, 21.0, 18.0, 45.0, 62.0, 73.0, 101.0, 149.0, 160.0, 283.0, 411.0, 466.0, 634.0, 962.0, 1338.0, 1998.0, 2694.0, 4110.0, 6388.0, 11243.0, 21355.0, 48323.0, 141149.0, 480039.0, 201639.0, 63404.0, 25952.0, 13093.0, 7525.0, 4565.0, 3105.0, 2153.0, 1361.0, 976.0, 727.0, 535.0, 365.0, 270.0, 232.0, 155.0, 115.0, 84.0, 61.0, 43.0, 41.0, 29.0, 19.0, 10.0, 13.0, 4.0, 2.0, 7.0, 2.0, 4.0, 3.0], "bins": [-0.326416015625, -0.31641387939453125, -0.3064117431640625, -0.29640960693359375, -0.286407470703125, -0.27640533447265625, -0.2664031982421875, -0.25640106201171875, -0.24639892578125, -0.23639678955078125, -0.2263946533203125, -0.21639251708984375, -0.206390380859375, -0.19638824462890625, -0.1863861083984375, -0.17638397216796875, -0.1663818359375, -0.15637969970703125, -0.1463775634765625, -0.13637542724609375, -0.126373291015625, -0.11637115478515625, -0.1063690185546875, -0.09636688232421875, -0.08636474609375, -0.07636260986328125, -0.0663604736328125, -0.05635833740234375, -0.046356201171875, -0.03635406494140625, -0.0263519287109375, -0.01634979248046875, -0.00634765625, 0.00365447998046875, 0.0136566162109375, 0.02365875244140625, 0.033660888671875, 0.04366302490234375, 0.0536651611328125, 0.06366729736328125, 0.07366943359375, 0.08367156982421875, 0.0936737060546875, 0.10367584228515625, 0.113677978515625, 0.12368011474609375, 0.1336822509765625, 0.14368438720703125, 0.1536865234375, 0.16368865966796875, 0.1736907958984375, 0.18369293212890625, 0.193695068359375, 0.20369720458984375, 0.2136993408203125, 0.22370147705078125, 0.23370361328125, 0.24370574951171875, 0.2537078857421875, 0.26371002197265625, 0.273712158203125, 0.28371429443359375, 0.2937164306640625, 0.30371856689453125, 0.313720703125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 1.0, 1.0, 5.0, 3.0, 10.0, 12.0, 6.0, 16.0, 11.0, 13.0, 23.0, 22.0, 21.0, 17.0, 28.0, 28.0, 23.0, 41.0, 39.0, 28.0, 33.0, 45.0, 41.0, 32.0, 38.0, 52.0, 43.0, 50.0, 38.0, 40.0, 28.0, 23.0, 27.0, 19.0, 20.0, 28.0, 5.0, 16.0, 18.0, 11.0, 12.0, 11.0, 8.0, 1.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25732421875, -0.24888992309570312, -0.24045562744140625, -0.23202133178710938, -0.2235870361328125, -0.21515274047851562, -0.20671844482421875, -0.19828414916992188, -0.189849853515625, -0.18141555786132812, -0.17298126220703125, -0.16454696655273438, -0.1561126708984375, -0.14767837524414062, -0.13924407958984375, -0.13080978393554688, -0.12237548828125, -0.11394119262695312, -0.10550689697265625, -0.09707260131835938, -0.0886383056640625, -0.08020401000976562, -0.07176971435546875, -0.06333541870117188, -0.054901123046875, -0.046466827392578125, -0.03803253173828125, -0.029598236083984375, -0.0211639404296875, -0.012729644775390625, -0.00429534912109375, 0.004138946533203125, 0.0125732421875, 0.021007537841796875, 0.02944183349609375, 0.037876129150390625, 0.0463104248046875, 0.054744720458984375, 0.06317901611328125, 0.07161331176757812, 0.080047607421875, 0.08848190307617188, 0.09691619873046875, 0.10535049438476562, 0.1137847900390625, 0.12221908569335938, 0.13065338134765625, 0.13908767700195312, 0.14752197265625, 0.15595626831054688, 0.16439056396484375, 0.17282485961914062, 0.1812591552734375, 0.18969345092773438, 0.19812774658203125, 0.20656204223632812, 0.214996337890625, 0.22343063354492188, 0.23186492919921875, 0.24029922485351562, 0.2487335205078125, 0.2571678161621094, 0.26560211181640625, 0.2740364074707031, 0.282470703125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 8.0, 6.0, 12.0, 12.0, 22.0, 29.0, 41.0, 54.0, 81.0, 124.0, 159.0, 227.0, 336.0, 458.0, 669.0, 991.0, 1485.0, 2435.0, 3988.0, 6880.0, 13400.0, 30426.0, 95080.0, 658071.0, 155313.0, 40453.0, 16595.0, 8310.0, 4685.0, 2879.0, 1719.0, 1098.0, 758.0, 530.0, 372.0, 227.0, 167.0, 119.0, 80.0, 67.0, 59.0, 44.0, 29.0, 16.0, 13.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04766845703125, -0.04616212844848633, -0.044655799865722656, -0.043149471282958984, -0.04164314270019531, -0.04013681411743164, -0.03863048553466797, -0.0371241569519043, -0.035617828369140625, -0.03411149978637695, -0.03260517120361328, -0.03109884262084961, -0.029592514038085938, -0.028086185455322266, -0.026579856872558594, -0.025073528289794922, -0.02356719970703125, -0.022060871124267578, -0.020554542541503906, -0.019048213958740234, -0.017541885375976562, -0.01603555679321289, -0.014529228210449219, -0.013022899627685547, -0.011516571044921875, -0.010010242462158203, -0.008503913879394531, -0.006997585296630859, -0.0054912567138671875, -0.003984928131103516, -0.0024785995483398438, -0.0009722709655761719, 0.0005340576171875, 0.002040386199951172, 0.0035467147827148438, 0.005053043365478516, 0.0065593719482421875, 0.00806570053100586, 0.009572029113769531, 0.011078357696533203, 0.012584686279296875, 0.014091014862060547, 0.015597343444824219, 0.01710367202758789, 0.018610000610351562, 0.020116329193115234, 0.021622657775878906, 0.023128986358642578, 0.02463531494140625, 0.026141643524169922, 0.027647972106933594, 0.029154300689697266, 0.030660629272460938, 0.03216695785522461, 0.03367328643798828, 0.03517961502075195, 0.036685943603515625, 0.0381922721862793, 0.03969860076904297, 0.04120492935180664, 0.04271125793457031, 0.044217586517333984, 0.045723915100097656, 0.04723024368286133, 0.048736572265625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 4.0, 2.0, 7.0, 3.0, 7.0, 16.0, 4.0, 25.0, 20.0, 22.0, 56.0, 37.0, 83.0, 62.0, 45.0, 134.0, 88.0, 104.0, 50.0, 57.0, 24.0, 26.0, 32.0, 9.0, 23.0, 13.0, 4.0, 8.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.7418136596679688e-06, -2.6579946279525757e-06, -2.5741755962371826e-06, -2.4903565645217896e-06, -2.4065375328063965e-06, -2.3227185010910034e-06, -2.2388994693756104e-06, -2.1550804376602173e-06, -2.0712614059448242e-06, -1.987442374229431e-06, -1.903623342514038e-06, -1.819804310798645e-06, -1.735985279083252e-06, -1.6521662473678589e-06, -1.5683472156524658e-06, -1.4845281839370728e-06, -1.4007091522216797e-06, -1.3168901205062866e-06, -1.2330710887908936e-06, -1.1492520570755005e-06, -1.0654330253601074e-06, -9.816139936447144e-07, -8.977949619293213e-07, -8.139759302139282e-07, -7.301568984985352e-07, -6.463378667831421e-07, -5.62518835067749e-07, -4.78699803352356e-07, -3.948807716369629e-07, -3.110617399215698e-07, -2.2724270820617676e-07, -1.434236764907837e-07, -5.960464477539063e-08, 2.421438694000244e-08, 1.0803341865539551e-07, 1.9185245037078857e-07, 2.7567148208618164e-07, 3.594905138015747e-07, 4.4330954551696777e-07, 5.271285772323608e-07, 6.109476089477539e-07, 6.94766640663147e-07, 7.7858567237854e-07, 8.624047040939331e-07, 9.462237358093262e-07, 1.0300427675247192e-06, 1.1138617992401123e-06, 1.1976808309555054e-06, 1.2814998626708984e-06, 1.3653188943862915e-06, 1.4491379261016846e-06, 1.5329569578170776e-06, 1.6167759895324707e-06, 1.7005950212478638e-06, 1.7844140529632568e-06, 1.86823308467865e-06, 1.952052116394043e-06, 2.035871148109436e-06, 2.119690179824829e-06, 2.203509211540222e-06, 2.2873282432556152e-06, 2.3711472749710083e-06, 2.4549663066864014e-06, 2.5387853384017944e-06, 2.6226043701171875e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 1.0, 4.0, 12.0, 12.0, 17.0, 29.0, 52.0, 67.0, 83.0, 115.0, 160.0, 252.0, 359.0, 553.0, 748.0, 1052.0, 1442.0, 2166.0, 3136.0, 4982.0, 7489.0, 11921.0, 20809.0, 38225.0, 81994.0, 311763.0, 374340.0, 88709.0, 40148.0, 21861.0, 12686.0, 7722.0, 4989.0, 3330.0, 2233.0, 1501.0, 1076.0, 777.0, 522.0, 357.0, 233.0, 192.0, 134.0, 91.0, 69.0, 52.0, 26.0, 20.0, 22.0, 13.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.038726806640625, -0.03755474090576172, -0.03638267517089844, -0.035210609436035156, -0.034038543701171875, -0.032866477966308594, -0.03169441223144531, -0.03052234649658203, -0.02935028076171875, -0.02817821502685547, -0.027006149291992188, -0.025834083557128906, -0.024662017822265625, -0.023489952087402344, -0.022317886352539062, -0.02114582061767578, -0.0199737548828125, -0.01880168914794922, -0.017629623413085938, -0.016457557678222656, -0.015285491943359375, -0.014113426208496094, -0.012941360473632812, -0.011769294738769531, -0.01059722900390625, -0.009425163269042969, -0.008253097534179688, -0.007081031799316406, -0.005908966064453125, -0.004736900329589844, -0.0035648345947265625, -0.0023927688598632812, -0.001220703125, -4.863739013671875e-05, 0.0011234283447265625, 0.0022954940795898438, 0.003467559814453125, 0.004639625549316406, 0.0058116912841796875, 0.006983757019042969, 0.00815582275390625, 0.009327888488769531, 0.010499954223632812, 0.011672019958496094, 0.012844085693359375, 0.014016151428222656, 0.015188217163085938, 0.01636028289794922, 0.0175323486328125, 0.01870441436767578, 0.019876480102539062, 0.021048545837402344, 0.022220611572265625, 0.023392677307128906, 0.024564743041992188, 0.02573680877685547, 0.02690887451171875, 0.02808094024658203, 0.029253005981445312, 0.030425071716308594, 0.031597137451171875, 0.032769203186035156, 0.03394126892089844, 0.03511333465576172, 0.036285400390625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 9.0, 7.0, 9.0, 5.0, 11.0, 10.0, 14.0, 11.0, 12.0, 19.0, 24.0, 33.0, 47.0, 55.0, 86.0, 104.0, 136.0, 100.0, 80.0, 51.0, 39.0, 21.0, 18.0, 13.0, 13.0, 11.0, 12.0, 10.0, 7.0, 6.0, 3.0, 6.0, 1.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0085601806640625, -0.00827789306640625, -0.00799560546875, -0.00771331787109375, -0.0074310302734375, -0.00714874267578125, -0.006866455078125, -0.00658416748046875, -0.0063018798828125, -0.00601959228515625, -0.0057373046875, -0.00545501708984375, -0.0051727294921875, -0.00489044189453125, -0.004608154296875, -0.00432586669921875, -0.0040435791015625, -0.00376129150390625, -0.00347900390625, -0.00319671630859375, -0.0029144287109375, -0.00263214111328125, -0.002349853515625, -0.00206756591796875, -0.0017852783203125, -0.00150299072265625, -0.001220703125, -0.00093841552734375, -0.0006561279296875, -0.00037384033203125, -9.1552734375e-05, 0.00019073486328125, 0.0004730224609375, 0.00075531005859375, 0.00103759765625, 0.00131988525390625, 0.0016021728515625, 0.00188446044921875, 0.002166748046875, 0.00244903564453125, 0.0027313232421875, 0.00301361083984375, 0.0032958984375, 0.00357818603515625, 0.0038604736328125, 0.00414276123046875, 0.004425048828125, 0.00470733642578125, 0.0049896240234375, 0.00527191162109375, 0.00555419921875, 0.00583648681640625, 0.0061187744140625, 0.00640106201171875, 0.006683349609375, 0.00696563720703125, 0.0072479248046875, 0.00753021240234375, 0.0078125, 0.00809478759765625, 0.0083770751953125, 0.00865936279296875, 0.008941650390625, 0.00922393798828125, 0.0095062255859375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 1.0, 7.0, 6.0, 7.0, 12.0, 8.0, 14.0, 15.0, 23.0, 24.0, 39.0, 31.0, 46.0, 56.0, 91.0, 91.0, 86.0, 103.0, 73.0, 53.0, 41.0, 33.0, 27.0, 21.0, 16.0, 14.0, 17.0, 10.0, 5.0, 8.0, 6.0, 2.0, 3.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.6510952115058899, -0.6335471272468567, -0.6159989833831787, -0.5984508991241455, -0.5809028148651123, -0.5633546710014343, -0.5458065867424011, -0.5282585024833679, -0.5107103586196899, -0.49316224455833435, -0.47561416029930115, -0.45806604623794556, -0.44051793217658997, -0.4229698181152344, -0.40542173385620117, -0.3878736197948456, -0.3703255355358124, -0.3527774214744568, -0.3352293372154236, -0.317681223154068, -0.3001331090927124, -0.2825850248336792, -0.2650369107723236, -0.24748879671096802, -0.22994069755077362, -0.21239259839057922, -0.19484448432922363, -0.17729638516902924, -0.15974828600883484, -0.14220017194747925, -0.12465207278728485, -0.10710396617650986, -0.08955585956573486, -0.07200775295495987, -0.054459650069475174, -0.03691154718399048, -0.019363440573215485, -0.0018153339624404907, 0.015732765197753906, 0.0332808718085289, 0.050828978419303894, 0.06837708503007889, 0.08592519164085388, 0.10347329080104828, 0.12102139741182327, 0.13856950402259827, 0.15611760318279266, 0.17366570234298706, 0.19121381640434265, 0.20876191556453705, 0.22631002962589264, 0.24385812878608704, 0.2614062428474426, 0.27895432710647583, 0.2965024411678314, 0.314050555229187, 0.3315986394882202, 0.3491467535495758, 0.366694837808609, 0.3842429518699646, 0.4017910659313202, 0.4193391799926758, 0.436887264251709, 0.4544353783130646, 0.47198349237442017]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 5.0, 3.0, 8.0, 6.0, 13.0, 14.0, 15.0, 14.0, 19.0, 27.0, 31.0, 25.0, 38.0, 40.0, 42.0, 33.0, 32.0, 43.0, 41.0, 34.0, 38.0, 37.0, 46.0, 44.0, 27.0, 43.0, 33.0, 41.0, 29.0, 21.0, 30.0, 15.0, 20.0, 19.0, 17.0, 18.0, 4.0, 6.0, 8.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5081380009651184, -0.4941581189632416, -0.48017823696136475, -0.4661983549594879, -0.4522184729576111, -0.43823862075805664, -0.4242587387561798, -0.410278856754303, -0.39629897475242615, -0.3823190927505493, -0.3683392107486725, -0.35435932874679565, -0.3403794765472412, -0.326399564743042, -0.31241971254348755, -0.2984398305416107, -0.2844599485397339, -0.27048006653785706, -0.2565001845359802, -0.2425203174352646, -0.22854043543338776, -0.21456055343151093, -0.2005806863307953, -0.18660080432891846, -0.17262092232704163, -0.1586410403251648, -0.14466115832328796, -0.13068129122257233, -0.1167014092206955, -0.10272152721881866, -0.08874165266752243, -0.0747617781162262, -0.06078192591667175, -0.04680204764008522, -0.03282216936349869, -0.018842291086912155, -0.0048624128103256226, 0.009117469191551208, 0.023097343742847443, 0.03707721829414368, 0.05105710029602051, 0.06503698229789734, 0.07901685684919357, 0.09299673140048981, 0.10697661340236664, 0.12095649540424347, 0.1349363625049591, 0.14891624450683594, 0.16289612650871277, 0.1768760085105896, 0.19085589051246643, 0.20483575761318207, 0.2188156396150589, 0.23279552161693573, 0.24677538871765137, 0.2607552707195282, 0.27473515272140503, 0.28871503472328186, 0.3026949167251587, 0.3166747987270355, 0.33065468072891235, 0.3446345329284668, 0.35861441493034363, 0.37259429693222046, 0.3865741789340973]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 11.0, 12.0, 14.0, 28.0, 33.0, 47.0, 89.0, 122.0, 166.0, 278.0, 385.0, 557.0, 815.0, 1261.0, 2031.0, 3134.0, 4825.0, 7668.0, 12762.0, 20819.0, 35609.0, 62904.0, 116523.0, 221774.0, 247346.0, 134913.0, 72246.0, 40567.0, 23761.0, 13901.0, 8765.0, 5470.0, 3328.0, 2202.0, 1450.0, 933.0, 596.0, 396.0, 259.0, 191.0, 120.0, 94.0, 57.0, 32.0, 22.0, 23.0, 12.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.71337890625, -0.6896896362304688, -0.6660003662109375, -0.6423110961914062, -0.618621826171875, -0.5949325561523438, -0.5712432861328125, -0.5475540161132812, -0.52386474609375, -0.5001754760742188, -0.4764862060546875, -0.45279693603515625, -0.429107666015625, -0.40541839599609375, -0.3817291259765625, -0.35803985595703125, -0.3343505859375, -0.31066131591796875, -0.2869720458984375, -0.26328277587890625, -0.239593505859375, -0.21590423583984375, -0.1922149658203125, -0.16852569580078125, -0.14483642578125, -0.12114715576171875, -0.0974578857421875, -0.07376861572265625, -0.050079345703125, -0.02639007568359375, -0.0027008056640625, 0.02098846435546875, 0.044677734375, 0.06836700439453125, 0.0920562744140625, 0.11574554443359375, 0.139434814453125, 0.16312408447265625, 0.1868133544921875, 0.21050262451171875, 0.23419189453125, 0.25788116455078125, 0.2815704345703125, 0.30525970458984375, 0.328948974609375, 0.35263824462890625, 0.3763275146484375, 0.40001678466796875, 0.4237060546875, 0.44739532470703125, 0.4710845947265625, 0.49477386474609375, 0.518463134765625, 0.5421524047851562, 0.5658416748046875, 0.5895309448242188, 0.61322021484375, 0.6369094848632812, 0.6605987548828125, 0.6842880249023438, 0.707977294921875, 0.7316665649414062, 0.7553558349609375, 0.7790451049804688, 0.802734375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 2.0, 6.0, 9.0, 12.0, 8.0, 21.0, 18.0, 23.0, 22.0, 27.0, 29.0, 37.0, 31.0, 41.0, 34.0, 42.0, 47.0, 36.0, 31.0, 30.0, 47.0, 47.0, 41.0, 30.0, 45.0, 25.0, 37.0, 26.0, 23.0, 22.0, 32.0, 19.0, 15.0, 12.0, 12.0, 17.0, 11.0, 7.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.447265625, -0.4349365234375, -0.422607421875, -0.4102783203125, -0.39794921875, -0.3856201171875, -0.373291015625, -0.3609619140625, -0.3486328125, -0.3363037109375, -0.323974609375, -0.3116455078125, -0.29931640625, -0.2869873046875, -0.274658203125, -0.2623291015625, -0.25, -0.2376708984375, -0.225341796875, -0.2130126953125, -0.20068359375, -0.1883544921875, -0.176025390625, -0.1636962890625, -0.1513671875, -0.1390380859375, -0.126708984375, -0.1143798828125, -0.10205078125, -0.0897216796875, -0.077392578125, -0.0650634765625, -0.052734375, -0.0404052734375, -0.028076171875, -0.0157470703125, -0.00341796875, 0.0089111328125, 0.021240234375, 0.0335693359375, 0.0458984375, 0.0582275390625, 0.070556640625, 0.0828857421875, 0.09521484375, 0.1075439453125, 0.119873046875, 0.1322021484375, 0.14453125, 0.1568603515625, 0.169189453125, 0.1815185546875, 0.19384765625, 0.2061767578125, 0.218505859375, 0.2308349609375, 0.2431640625, 0.2554931640625, 0.267822265625, 0.2801513671875, 0.29248046875, 0.3048095703125, 0.317138671875, 0.3294677734375, 0.341796875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 13.0, 15.0, 26.0, 40.0, 55.0, 68.0, 127.0, 137.0, 226.0, 298.0, 510.0, 778.0, 1234.0, 1978.0, 3400.0, 5638.0, 9842.0, 16503.0, 29079.0, 52860.0, 100364.0, 207865.0, 300773.0, 147034.0, 74811.0, 40268.0, 22329.0, 12907.0, 7627.0, 4586.0, 2699.0, 1590.0, 943.0, 619.0, 387.0, 303.0, 198.0, 124.0, 100.0, 56.0, 37.0, 32.0, 19.0, 11.0, 20.0, 4.0, 4.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.80419921875, -0.7792816162109375, -0.754364013671875, -0.7294464111328125, -0.70452880859375, -0.6796112060546875, -0.654693603515625, -0.6297760009765625, -0.6048583984375, -0.5799407958984375, -0.555023193359375, -0.5301055908203125, -0.50518798828125, -0.4802703857421875, -0.455352783203125, -0.4304351806640625, -0.405517578125, -0.3805999755859375, -0.355682373046875, -0.3307647705078125, -0.30584716796875, -0.2809295654296875, -0.256011962890625, -0.2310943603515625, -0.2061767578125, -0.1812591552734375, -0.156341552734375, -0.1314239501953125, -0.10650634765625, -0.0815887451171875, -0.056671142578125, -0.0317535400390625, -0.0068359375, 0.0180816650390625, 0.042999267578125, 0.0679168701171875, 0.09283447265625, 0.1177520751953125, 0.142669677734375, 0.1675872802734375, 0.1925048828125, 0.2174224853515625, 0.242340087890625, 0.2672576904296875, 0.29217529296875, 0.3170928955078125, 0.342010498046875, 0.3669281005859375, 0.391845703125, 0.4167633056640625, 0.441680908203125, 0.4665985107421875, 0.49151611328125, 0.5164337158203125, 0.541351318359375, 0.5662689208984375, 0.5911865234375, 0.6161041259765625, 0.641021728515625, 0.6659393310546875, 0.69085693359375, 0.7157745361328125, 0.740692138671875, 0.7656097412109375, 0.79052734375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 12.0, 10.0, 16.0, 19.0, 15.0, 30.0, 18.0, 29.0, 32.0, 32.0, 36.0, 30.0, 33.0, 42.0, 51.0, 49.0, 34.0, 45.0, 47.0, 31.0, 49.0, 42.0, 33.0, 32.0, 27.0, 26.0, 33.0, 27.0, 14.0, 12.0, 14.0, 13.0, 16.0, 5.0, 7.0, 11.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.269775390625, -0.26175498962402344, -0.2537345886230469, -0.2457141876220703, -0.23769378662109375, -0.2296733856201172, -0.22165298461914062, -0.21363258361816406, -0.2056121826171875, -0.19759178161621094, -0.18957138061523438, -0.1815509796142578, -0.17353057861328125, -0.1655101776123047, -0.15748977661132812, -0.14946937561035156, -0.141448974609375, -0.13342857360839844, -0.12540817260742188, -0.11738777160644531, -0.10936737060546875, -0.10134696960449219, -0.09332656860351562, -0.08530616760253906, -0.0772857666015625, -0.06926536560058594, -0.061244964599609375, -0.05322456359863281, -0.04520416259765625, -0.03718376159667969, -0.029163360595703125, -0.021142959594726562, -0.01312255859375, -0.0051021575927734375, 0.002918243408203125, 0.010938644409179688, 0.01895904541015625, 0.026979446411132812, 0.034999847412109375, 0.04302024841308594, 0.0510406494140625, 0.05906105041503906, 0.06708145141601562, 0.07510185241699219, 0.08312225341796875, 0.09114265441894531, 0.09916305541992188, 0.10718345642089844, 0.115203857421875, 0.12322425842285156, 0.13124465942382812, 0.1392650604248047, 0.14728546142578125, 0.1553058624267578, 0.16332626342773438, 0.17134666442871094, 0.1793670654296875, 0.18738746643066406, 0.19540786743164062, 0.2034282684326172, 0.21144866943359375, 0.2194690704345703, 0.22748947143554688, 0.23550987243652344, 0.2435302734375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 1.0, 12.0, 11.0, 22.0, 18.0, 34.0, 47.0, 52.0, 91.0, 133.0, 209.0, 322.0, 516.0, 854.0, 1353.0, 2305.0, 3723.0, 6511.0, 11689.0, 22311.0, 48534.0, 215365.0, 624901.0, 55186.0, 24211.0, 12634.0, 6984.0, 4091.0, 2422.0, 1471.0, 940.0, 545.0, 360.0, 217.0, 153.0, 98.0, 61.0, 47.0, 34.0, 18.0, 21.0, 13.0, 7.0, 9.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.68115234375, -0.6617279052734375, -0.642303466796875, -0.6228790283203125, -0.60345458984375, -0.5840301513671875, -0.564605712890625, -0.5451812744140625, -0.5257568359375, -0.5063323974609375, -0.486907958984375, -0.4674835205078125, -0.44805908203125, -0.4286346435546875, -0.409210205078125, -0.3897857666015625, -0.370361328125, -0.3509368896484375, -0.331512451171875, -0.3120880126953125, -0.29266357421875, -0.2732391357421875, -0.253814697265625, -0.2343902587890625, -0.2149658203125, -0.1955413818359375, -0.176116943359375, -0.1566925048828125, -0.13726806640625, -0.1178436279296875, -0.098419189453125, -0.0789947509765625, -0.0595703125, -0.0401458740234375, -0.020721435546875, -0.0012969970703125, 0.01812744140625, 0.0375518798828125, 0.056976318359375, 0.0764007568359375, 0.0958251953125, 0.1152496337890625, 0.134674072265625, 0.1540985107421875, 0.17352294921875, 0.1929473876953125, 0.212371826171875, 0.2317962646484375, 0.251220703125, 0.2706451416015625, 0.290069580078125, 0.3094940185546875, 0.32891845703125, 0.3483428955078125, 0.367767333984375, 0.3871917724609375, 0.4066162109375, 0.4260406494140625, 0.445465087890625, 0.4648895263671875, 0.48431396484375, 0.5037384033203125, 0.523162841796875, 0.5425872802734375, 0.56201171875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 8.0, 1.0, 9.0, 8.0, 12.0, 13.0, 18.0, 24.0, 29.0, 59.0, 134.0, 311.0, 139.0, 47.0, 34.0, 33.0, 24.0, 12.0, 12.0, 9.0, 5.0, 4.0, 7.0, 9.0, 1.0, 4.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3113021850585938e-05, -1.2696720659732819e-05, -1.22804194688797e-05, -1.186411827802658e-05, -1.1447817087173462e-05, -1.1031515896320343e-05, -1.0615214705467224e-05, -1.0198913514614105e-05, -9.782612323760986e-06, -9.366311132907867e-06, -8.950009942054749e-06, -8.53370875120163e-06, -8.11740756034851e-06, -7.701106369495392e-06, -7.284805178642273e-06, -6.868503987789154e-06, -6.452202796936035e-06, -6.035901606082916e-06, -5.619600415229797e-06, -5.2032992243766785e-06, -4.7869980335235596e-06, -4.370696842670441e-06, -3.954395651817322e-06, -3.538094460964203e-06, -3.121793270111084e-06, -2.705492079257965e-06, -2.289190888404846e-06, -1.8728896975517273e-06, -1.4565885066986084e-06, -1.0402873158454895e-06, -6.239861249923706e-07, -2.076849341392517e-07, 2.086162567138672e-07, 6.249174475669861e-07, 1.041218638420105e-06, 1.4575198292732239e-06, 1.8738210201263428e-06, 2.2901222109794617e-06, 2.7064234018325806e-06, 3.1227245926856995e-06, 3.5390257835388184e-06, 3.955326974391937e-06, 4.371628165245056e-06, 4.787929356098175e-06, 5.204230546951294e-06, 5.620531737804413e-06, 6.036832928657532e-06, 6.453134119510651e-06, 6.8694353103637695e-06, 7.2857365012168884e-06, 7.702037692070007e-06, 8.118338882923126e-06, 8.534640073776245e-06, 8.950941264629364e-06, 9.367242455482483e-06, 9.783543646335602e-06, 1.019984483718872e-05, 1.061614602804184e-05, 1.1032447218894958e-05, 1.1448748409748077e-05, 1.1865049600601196e-05, 1.2281350791454315e-05, 1.2697651982307434e-05, 1.3113953173160553e-05, 1.3530254364013672e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 5.0, 10.0, 15.0, 16.0, 22.0, 38.0, 62.0, 75.0, 109.0, 146.0, 208.0, 292.0, 429.0, 646.0, 966.0, 1471.0, 2375.0, 4074.0, 7573.0, 15610.0, 36040.0, 120232.0, 747999.0, 61375.0, 23504.0, 10890.0, 5599.0, 3128.0, 1944.0, 1206.0, 750.0, 541.0, 345.0, 235.0, 182.0, 137.0, 90.0, 53.0, 45.0, 33.0, 26.0, 19.0, 13.0, 6.0, 4.0, 7.0, 6.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74853515625, -0.7229537963867188, -0.6973724365234375, -0.6717910766601562, -0.646209716796875, -0.6206283569335938, -0.5950469970703125, -0.5694656372070312, -0.54388427734375, -0.5183029174804688, -0.4927215576171875, -0.46714019775390625, -0.441558837890625, -0.41597747802734375, -0.3903961181640625, -0.36481475830078125, -0.3392333984375, -0.31365203857421875, -0.2880706787109375, -0.26248931884765625, -0.236907958984375, -0.21132659912109375, -0.1857452392578125, -0.16016387939453125, -0.13458251953125, -0.10900115966796875, -0.0834197998046875, -0.05783843994140625, -0.032257080078125, -0.00667572021484375, 0.0189056396484375, 0.04448699951171875, 0.070068359375, 0.09564971923828125, 0.1212310791015625, 0.14681243896484375, 0.172393798828125, 0.19797515869140625, 0.2235565185546875, 0.24913787841796875, 0.27471923828125, 0.30030059814453125, 0.3258819580078125, 0.35146331787109375, 0.377044677734375, 0.40262603759765625, 0.4282073974609375, 0.45378875732421875, 0.4793701171875, 0.5049514770507812, 0.5305328369140625, 0.5561141967773438, 0.581695556640625, 0.6072769165039062, 0.6328582763671875, 0.6584396362304688, 0.68402099609375, 0.7096023559570312, 0.7351837158203125, 0.7607650756835938, 0.786346435546875, 0.8119277954101562, 0.8375091552734375, 0.8630905151367188, 0.888671875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 8.0, 6.0, 8.0, 20.0, 19.0, 18.0, 20.0, 42.0, 51.0, 82.0, 447.0, 75.0, 27.0, 34.0, 28.0, 30.0, 16.0, 12.0, 10.0, 7.0, 5.0, 6.0, 2.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.26459312438964844, -0.2577018737792969, -0.2508106231689453, -0.24391937255859375, -0.2370281219482422, -0.23013687133789062, -0.22324562072753906, -0.2163543701171875, -0.20946311950683594, -0.20257186889648438, -0.1956806182861328, -0.18878936767578125, -0.1818981170654297, -0.17500686645507812, -0.16811561584472656, -0.161224365234375, -0.15433311462402344, -0.14744186401367188, -0.1405506134033203, -0.13365936279296875, -0.1267681121826172, -0.11987686157226562, -0.11298561096191406, -0.1060943603515625, -0.09920310974121094, -0.09231185913085938, -0.08542060852050781, -0.07852935791015625, -0.07163810729980469, -0.06474685668945312, -0.05785560607910156, -0.05096435546875, -0.04407310485839844, -0.037181854248046875, -0.030290603637695312, -0.02339935302734375, -0.016508102416992188, -0.009616851806640625, -0.0027256011962890625, 0.0041656494140625, 0.011056900024414062, 0.017948150634765625, 0.024839401245117188, 0.03173065185546875, 0.03862190246582031, 0.045513153076171875, 0.05240440368652344, 0.059295654296875, 0.06618690490722656, 0.07307815551757812, 0.07996940612792969, 0.08686065673828125, 0.09375190734863281, 0.10064315795898438, 0.10753440856933594, 0.1144256591796875, 0.12131690979003906, 0.12820816040039062, 0.1350994110107422, 0.14199066162109375, 0.1488819122314453, 0.15577316284179688, 0.16266441345214844, 0.1695556640625]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 4.0, 8.0, 5.0, 10.0, 10.0, 15.0, 19.0, 27.0, 12.0, 32.0, 47.0, 46.0, 61.0, 78.0, 101.0, 101.0, 92.0, 78.0, 54.0, 38.0, 35.0, 20.0, 21.0, 11.0, 16.0, 12.0, 6.0, 3.0, 5.0, 10.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.6138788461685181, -0.5967633724212646, -0.5796478986740112, -0.562532365322113, -0.5454168915748596, -0.5283014178276062, -0.5111859440803528, -0.49407047033309937, -0.47695496678352356, -0.45983949303627014, -0.44272398948669434, -0.4256085157394409, -0.4084930419921875, -0.3913775384426117, -0.3742620646953583, -0.35714656114578247, -0.34003108739852905, -0.32291561365127563, -0.30580011010169983, -0.2886846363544464, -0.2715691328048706, -0.2544536590576172, -0.23733818531036377, -0.22022269666194916, -0.20310720801353455, -0.18599171936511993, -0.16887623071670532, -0.1517607569694519, -0.1346452683210373, -0.11752977967262268, -0.10041429847478867, -0.08329881727695465, -0.06618332862854004, -0.049067843705415726, -0.03195235878229141, -0.014836873859167099, 0.0022786110639572144, 0.019394099712371826, 0.03650958091020584, 0.053625062108039856, 0.07074055075645447, 0.08785603940486908, 0.1049715206027031, 0.12208700180053711, 0.13920249044895172, 0.15631797909736633, 0.17343345284461975, 0.19054894149303436, 0.20766443014144897, 0.2247799187898636, 0.2418954074382782, 0.2590108811855316, 0.2761263847351074, 0.29324185848236084, 0.31035733222961426, 0.3274728059768677, 0.3445883095264435, 0.3617037832736969, 0.3788192868232727, 0.3959347605705261, 0.41305023431777954, 0.43016573786735535, 0.44728121161460876, 0.46439671516418457, 0.481512188911438]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 5.0, 9.0, 9.0, 21.0, 17.0, 16.0, 18.0, 29.0, 34.0, 32.0, 34.0, 33.0, 40.0, 40.0, 45.0, 37.0, 44.0, 51.0, 39.0, 42.0, 50.0, 35.0, 22.0, 31.0, 32.0, 25.0, 27.0, 29.0, 22.0, 26.0, 16.0, 13.0, 14.0, 15.0, 7.0, 7.0, 11.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.4291985034942627, -0.4158165454864502, -0.4024345874786377, -0.3890526294708252, -0.3756707012653351, -0.3622887432575226, -0.3489067852497101, -0.3355248272418976, -0.3221428692340851, -0.3087609112262726, -0.2953789532184601, -0.28199702501296997, -0.26861506700515747, -0.25523310899734497, -0.24185115098953247, -0.22846919298171997, -0.21508724987506866, -0.20170529186725616, -0.18832334876060486, -0.17494139075279236, -0.16155943274497986, -0.14817747473716736, -0.13479553163051605, -0.12141357362270355, -0.10803162306547165, -0.09464967250823975, -0.08126771450042725, -0.06788576394319534, -0.05450380966067314, -0.04112185537815094, -0.027739904820919037, -0.014357946813106537, -0.0009759962558746338, 0.012405957095324993, 0.02578791044652462, 0.03916986286640167, 0.052551817148923874, 0.06593377143144608, 0.07931572198867798, 0.09269767999649048, 0.10607963055372238, 0.11946158111095428, 0.13284353911876678, 0.1462254822254181, 0.1596074402332306, 0.1729893982410431, 0.1863713562488556, 0.1997533142566681, 0.2131352573633194, 0.2265172153711319, 0.2398991584777832, 0.2532811164855957, 0.2666630744934082, 0.2800450325012207, 0.2934269905090332, 0.3068089485168457, 0.3201908767223358, 0.3335728347301483, 0.3469547927379608, 0.3603367209434509, 0.3737186789512634, 0.3871006369590759, 0.4004825949668884, 0.4138645529747009, 0.4272465109825134]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 15.0, 18.0, 31.0, 41.0, 72.0, 85.0, 142.0, 207.0, 324.0, 505.0, 796.0, 1128.0, 1747.0, 2710.0, 4239.0, 6626.0, 10439.0, 16879.0, 27205.0, 46829.0, 81605.0, 155142.0, 355946.0, 1188933.0, 1447499.0, 430165.0, 178108.0, 94034.0, 53697.0, 32241.0, 20032.0, 12466.0, 8162.0, 5385.0, 3503.0, 2366.0, 1553.0, 1069.0, 769.0, 509.0, 334.0, 228.0, 169.0, 107.0, 70.0, 57.0, 37.0, 18.0, 20.0, 9.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.51708984375, -0.5009841918945312, -0.4848785400390625, -0.46877288818359375, -0.452667236328125, -0.43656158447265625, -0.4204559326171875, -0.40435028076171875, -0.38824462890625, -0.37213897705078125, -0.3560333251953125, -0.33992767333984375, -0.323822021484375, -0.30771636962890625, -0.2916107177734375, -0.27550506591796875, -0.2593994140625, -0.24329376220703125, -0.2271881103515625, -0.21108245849609375, -0.194976806640625, -0.17887115478515625, -0.1627655029296875, -0.14665985107421875, -0.13055419921875, -0.11444854736328125, -0.0983428955078125, -0.08223724365234375, -0.066131591796875, -0.05002593994140625, -0.0339202880859375, -0.01781463623046875, -0.001708984375, 0.01439666748046875, 0.0305023193359375, 0.04660797119140625, 0.062713623046875, 0.07881927490234375, 0.0949249267578125, 0.11103057861328125, 0.12713623046875, 0.14324188232421875, 0.1593475341796875, 0.17545318603515625, 0.191558837890625, 0.20766448974609375, 0.2237701416015625, 0.23987579345703125, 0.2559814453125, 0.27208709716796875, 0.2881927490234375, 0.30429840087890625, 0.320404052734375, 0.33650970458984375, 0.3526153564453125, 0.36872100830078125, 0.38482666015625, 0.40093231201171875, 0.4170379638671875, 0.43314361572265625, 0.449249267578125, 0.46535491943359375, 0.4814605712890625, 0.49756622314453125, 0.513671875]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 2.0, 2.0, 7.0, 7.0, 7.0, 15.0, 12.0, 12.0, 19.0, 13.0, 25.0, 38.0, 35.0, 28.0, 22.0, 35.0, 39.0, 42.0, 50.0, 39.0, 50.0, 43.0, 37.0, 42.0, 47.0, 33.0, 27.0, 26.0, 31.0, 22.0, 23.0, 35.0, 28.0, 16.0, 22.0, 10.0, 13.0, 11.0, 7.0, 8.0, 6.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.2587890625, -0.2507781982421875, -0.242767333984375, -0.2347564697265625, -0.22674560546875, -0.2187347412109375, -0.210723876953125, -0.2027130126953125, -0.1947021484375, -0.1866912841796875, -0.178680419921875, -0.1706695556640625, -0.16265869140625, -0.1546478271484375, -0.146636962890625, -0.1386260986328125, -0.130615234375, -0.1226043701171875, -0.114593505859375, -0.1065826416015625, -0.09857177734375, -0.0905609130859375, -0.082550048828125, -0.0745391845703125, -0.0665283203125, -0.0585174560546875, -0.050506591796875, -0.0424957275390625, -0.03448486328125, -0.0264739990234375, -0.018463134765625, -0.0104522705078125, -0.00244140625, 0.0055694580078125, 0.013580322265625, 0.0215911865234375, 0.02960205078125, 0.0376129150390625, 0.045623779296875, 0.0536346435546875, 0.0616455078125, 0.0696563720703125, 0.077667236328125, 0.0856781005859375, 0.09368896484375, 0.1016998291015625, 0.109710693359375, 0.1177215576171875, 0.125732421875, 0.1337432861328125, 0.141754150390625, 0.1497650146484375, 0.15777587890625, 0.1657867431640625, 0.173797607421875, 0.1818084716796875, 0.1898193359375, 0.1978302001953125, 0.205841064453125, 0.2138519287109375, 0.22186279296875, 0.2298736572265625, 0.237884521484375, 0.2458953857421875, 0.25390625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 8.0, 10.0, 17.0, 40.0, 47.0, 86.0, 137.0, 218.0, 339.0, 622.0, 1053.0, 1635.0, 2666.0, 4607.0, 7645.0, 12929.0, 22002.0, 39036.0, 69812.0, 130305.0, 261864.0, 610857.0, 1542377.0, 814663.0, 323478.0, 156555.0, 82644.0, 45656.0, 25453.0, 15146.0, 8981.0, 5396.0, 3206.0, 1942.0, 1131.0, 686.0, 391.0, 262.0, 160.0, 86.0, 37.0, 31.0, 25.0, 10.0, 17.0, 6.0, 5.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.47119140625, -0.457183837890625, -0.44317626953125, -0.429168701171875, -0.4151611328125, -0.401153564453125, -0.38714599609375, -0.373138427734375, -0.359130859375, -0.345123291015625, -0.33111572265625, -0.317108154296875, -0.3031005859375, -0.289093017578125, -0.27508544921875, -0.261077880859375, -0.2470703125, -0.233062744140625, -0.21905517578125, -0.205047607421875, -0.1910400390625, -0.177032470703125, -0.16302490234375, -0.149017333984375, -0.135009765625, -0.121002197265625, -0.10699462890625, -0.092987060546875, -0.0789794921875, -0.064971923828125, -0.05096435546875, -0.036956787109375, -0.02294921875, -0.008941650390625, 0.00506591796875, 0.019073486328125, 0.0330810546875, 0.047088623046875, 0.06109619140625, 0.075103759765625, 0.089111328125, 0.103118896484375, 0.11712646484375, 0.131134033203125, 0.1451416015625, 0.159149169921875, 0.17315673828125, 0.187164306640625, 0.201171875, 0.215179443359375, 0.22918701171875, 0.243194580078125, 0.2572021484375, 0.271209716796875, 0.28521728515625, 0.299224853515625, 0.313232421875, 0.327239990234375, 0.34124755859375, 0.355255126953125, 0.3692626953125, 0.383270263671875, 0.39727783203125, 0.411285400390625, 0.42529296875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 10.0, 8.0, 14.0, 15.0, 30.0, 30.0, 23.0, 35.0, 50.0, 62.0, 77.0, 68.0, 116.0, 107.0, 149.0, 150.0, 201.0, 208.0, 218.0, 229.0, 277.0, 212.0, 237.0, 238.0, 201.0, 166.0, 148.0, 130.0, 123.0, 99.0, 78.0, 72.0, 66.0, 53.0, 28.0, 34.0, 16.0, 17.0, 16.0, 14.0, 12.0, 12.0, 9.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.1370849609375, -0.13317012786865234, -0.1292552947998047, -0.12534046173095703, -0.12142562866210938, -0.11751079559326172, -0.11359596252441406, -0.1096811294555664, -0.10576629638671875, -0.1018514633178711, -0.09793663024902344, -0.09402179718017578, -0.09010696411132812, -0.08619213104248047, -0.08227729797363281, -0.07836246490478516, -0.0744476318359375, -0.07053279876708984, -0.06661796569824219, -0.06270313262939453, -0.058788299560546875, -0.05487346649169922, -0.05095863342285156, -0.047043800354003906, -0.04312896728515625, -0.039214134216308594, -0.03529930114746094, -0.03138446807861328, -0.027469635009765625, -0.02355480194091797, -0.019639968872070312, -0.015725135803222656, -0.011810302734375, -0.007895469665527344, -0.0039806365966796875, -6.580352783203125e-05, 0.003849029541015625, 0.007763862609863281, 0.011678695678710938, 0.015593528747558594, 0.01950836181640625, 0.023423194885253906, 0.027338027954101562, 0.03125286102294922, 0.035167694091796875, 0.03908252716064453, 0.04299736022949219, 0.046912193298339844, 0.0508270263671875, 0.054741859436035156, 0.05865669250488281, 0.06257152557373047, 0.06648635864257812, 0.07040119171142578, 0.07431602478027344, 0.0782308578491211, 0.08214569091796875, 0.0860605239868164, 0.08997535705566406, 0.09389019012451172, 0.09780502319335938, 0.10171985626220703, 0.10563468933105469, 0.10954952239990234, 0.11346435546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 8.0, 9.0, 10.0, 7.0, 11.0, 14.0, 22.0, 25.0, 33.0, 42.0, 39.0, 69.0, 67.0, 87.0, 98.0, 79.0, 82.0, 44.0, 41.0, 45.0, 30.0, 26.0, 18.0, 18.0, 14.0, 10.0, 9.0, 5.0, 5.0, 3.0, 5.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.34995126724243164, -0.33881205320358276, -0.3276728391647339, -0.3165336549282074, -0.3053944408893585, -0.29425522685050964, -0.28311604261398315, -0.2719768285751343, -0.2608376145362854, -0.24969840049743652, -0.23855920135974884, -0.22742000222206116, -0.21628078818321228, -0.2051415741443634, -0.19400237500667572, -0.18286317586898804, -0.17172396183013916, -0.16058474779129028, -0.1494455486536026, -0.13830634951591492, -0.12716713547706604, -0.11602792888879776, -0.10488872230052948, -0.0937495157122612, -0.08261030912399292, -0.07147110253572464, -0.06033189594745636, -0.04919268935918808, -0.0380534827709198, -0.02691427618265152, -0.01577506959438324, -0.00463586300611496, 0.006503373384475708, 0.017642579972743988, 0.028781786561012268, 0.03992099314928055, 0.05106019973754883, 0.06219940632581711, 0.07333861291408539, 0.08447781950235367, 0.09561702609062195, 0.10675623267889023, 0.11789543926715851, 0.1290346384048462, 0.14017385244369507, 0.15131306648254395, 0.16245226562023163, 0.1735914647579193, 0.1847306787967682, 0.19586989283561707, 0.20700909197330475, 0.21814829111099243, 0.2292875051498413, 0.24042671918869019, 0.25156593322753906, 0.26270511746406555, 0.27384433150291443, 0.2849835455417633, 0.2961227297782898, 0.30726194381713867, 0.31840115785598755, 0.3295403718948364, 0.3406795859336853, 0.3518187701702118, 0.36295798420906067]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 9.0, 5.0, 5.0, 13.0, 8.0, 14.0, 15.0, 23.0, 21.0, 12.0, 31.0, 26.0, 30.0, 29.0, 36.0, 40.0, 41.0, 38.0, 51.0, 37.0, 36.0, 53.0, 39.0, 43.0, 38.0, 34.0, 29.0, 40.0, 28.0, 21.0, 22.0, 21.0, 19.0, 10.0, 17.0, 18.0, 13.0, 10.0, 12.0, 1.0, 3.0, 6.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2661156952381134, -0.2570849359035492, -0.24805417656898499, -0.23902340233325958, -0.22999264299869537, -0.22096188366413116, -0.21193110942840576, -0.20290035009384155, -0.19386959075927734, -0.18483883142471313, -0.17580807209014893, -0.16677729785442352, -0.15774653851985931, -0.1487157791852951, -0.1396850049495697, -0.1306542456150055, -0.12162348628044128, -0.11259272694587708, -0.10356196016073227, -0.09453119337558746, -0.08550043404102325, -0.07646967470645905, -0.06743890792131424, -0.058408141136169434, -0.049377381801605225, -0.04034661874175072, -0.03131585568189621, -0.022285092622041702, -0.013254329562187195, -0.004223566502332687, 0.00480719655752182, 0.013837963342666626, 0.022868752479553223, 0.03189951553940773, 0.04093027859926224, 0.049961041659116745, 0.05899180471897125, 0.06802256405353546, 0.07705333083868027, 0.08608409762382507, 0.09511485695838928, 0.10414561629295349, 0.1131763830780983, 0.1222071498632431, 0.1312379091978073, 0.14026866853237152, 0.14929944276809692, 0.15833020210266113, 0.16736096143722534, 0.17639172077178955, 0.18542248010635376, 0.19445325434207916, 0.20348401367664337, 0.21251477301120758, 0.22154554724693298, 0.2305763065814972, 0.2396070659160614, 0.2486378252506256, 0.2576685845851898, 0.26669934391975403, 0.2757301330566406, 0.28476089239120483, 0.29379165172576904, 0.30282241106033325, 0.31185317039489746]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [5.0, 4.0, 5.0, 15.0, 20.0, 17.0, 22.0, 19.0, 35.0, 61.0, 77.0, 117.0, 187.0, 220.0, 339.0, 468.0, 720.0, 975.0, 1395.0, 2033.0, 3020.0, 4334.0, 6269.0, 9448.0, 14445.0, 22371.0, 35294.0, 59209.0, 104994.0, 193950.0, 244622.0, 140233.0, 77426.0, 44732.0, 27805.0, 17711.0, 11484.0, 7658.0, 5236.0, 3520.0, 2433.0, 1717.0, 1185.0, 812.0, 544.0, 406.0, 284.0, 213.0, 127.0, 127.0, 74.0, 48.0, 27.0, 24.0, 16.0, 16.0, 6.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0], "bins": [-0.118408203125, -0.11449241638183594, -0.11057662963867188, -0.10666084289550781, -0.10274505615234375, -0.09882926940917969, -0.09491348266601562, -0.09099769592285156, -0.0870819091796875, -0.08316612243652344, -0.07925033569335938, -0.07533454895019531, -0.07141876220703125, -0.06750297546386719, -0.06358718872070312, -0.05967140197753906, -0.055755615234375, -0.05183982849121094, -0.047924041748046875, -0.04400825500488281, -0.04009246826171875, -0.03617668151855469, -0.032260894775390625, -0.028345108032226562, -0.0244293212890625, -0.020513534545898438, -0.016597747802734375, -0.012681961059570312, -0.00876617431640625, -0.0048503875732421875, -0.000934600830078125, 0.0029811859130859375, 0.00689697265625, 0.010812759399414062, 0.014728546142578125, 0.018644332885742188, 0.02256011962890625, 0.026475906372070312, 0.030391693115234375, 0.03430747985839844, 0.0382232666015625, 0.04213905334472656, 0.046054840087890625, 0.04997062683105469, 0.05388641357421875, 0.05780220031738281, 0.061717987060546875, 0.06563377380371094, 0.069549560546875, 0.07346534729003906, 0.07738113403320312, 0.08129692077636719, 0.08521270751953125, 0.08912849426269531, 0.09304428100585938, 0.09696006774902344, 0.1008758544921875, 0.10479164123535156, 0.10870742797851562, 0.11262321472167969, 0.11653900146484375, 0.12045478820800781, 0.12437057495117188, 0.12828636169433594, 0.1322021484375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 7.0, 7.0, 10.0, 13.0, 10.0, 11.0, 26.0, 22.0, 27.0, 35.0, 28.0, 38.0, 37.0, 38.0, 51.0, 47.0, 52.0, 49.0, 53.0, 37.0, 53.0, 44.0, 34.0, 27.0, 40.0, 35.0, 24.0, 23.0, 20.0, 14.0, 13.0, 18.0, 13.0, 14.0, 8.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30078125, -0.29064178466796875, -0.2805023193359375, -0.27036285400390625, -0.260223388671875, -0.25008392333984375, -0.2399444580078125, -0.22980499267578125, -0.21966552734375, -0.20952606201171875, -0.1993865966796875, -0.18924713134765625, -0.179107666015625, -0.16896820068359375, -0.1588287353515625, -0.14868927001953125, -0.1385498046875, -0.12841033935546875, -0.1182708740234375, -0.10813140869140625, -0.097991943359375, -0.08785247802734375, -0.0777130126953125, -0.06757354736328125, -0.05743408203125, -0.04729461669921875, -0.0371551513671875, -0.02701568603515625, -0.016876220703125, -0.00673675537109375, 0.0034027099609375, 0.01354217529296875, 0.023681640625, 0.03382110595703125, 0.0439605712890625, 0.05410003662109375, 0.064239501953125, 0.07437896728515625, 0.0845184326171875, 0.09465789794921875, 0.10479736328125, 0.11493682861328125, 0.1250762939453125, 0.13521575927734375, 0.145355224609375, 0.15549468994140625, 0.1656341552734375, 0.17577362060546875, 0.1859130859375, 0.19605255126953125, 0.2061920166015625, 0.21633148193359375, 0.226470947265625, 0.23661041259765625, 0.2467498779296875, 0.25688934326171875, 0.26702880859375, 0.27716827392578125, 0.2873077392578125, 0.29744720458984375, 0.307586669921875, 0.31772613525390625, 0.3278656005859375, 0.33800506591796875, 0.34814453125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 5.0, 1.0, 0.0, 4.0, 9.0, 11.0, 25.0, 23.0, 41.0, 49.0, 50.0, 104.0, 129.0, 165.0, 241.0, 315.0, 466.0, 678.0, 946.0, 1245.0, 1883.0, 2650.0, 4030.0, 6318.0, 10462.0, 19252.0, 41311.0, 111542.0, 418589.0, 274921.0, 79352.0, 32011.0, 15596.0, 8800.0, 5475.0, 3593.0, 2408.0, 1732.0, 1230.0, 860.0, 592.0, 439.0, 318.0, 206.0, 131.0, 114.0, 70.0, 52.0, 37.0, 30.0, 17.0, 9.0, 10.0, 6.0, 2.0, 4.0, 6.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.19775390625, -0.19112777709960938, -0.18450164794921875, -0.17787551879882812, -0.1712493896484375, -0.16462326049804688, -0.15799713134765625, -0.15137100219726562, -0.144744873046875, -0.13811874389648438, -0.13149261474609375, -0.12486648559570312, -0.1182403564453125, -0.11161422729492188, -0.10498809814453125, -0.09836196899414062, -0.09173583984375, -0.08510971069335938, -0.07848358154296875, -0.07185745239257812, -0.0652313232421875, -0.058605194091796875, -0.05197906494140625, -0.045352935791015625, -0.038726806640625, -0.032100677490234375, -0.02547454833984375, -0.018848419189453125, -0.0122222900390625, -0.005596160888671875, 0.00102996826171875, 0.007656097412109375, 0.0142822265625, 0.020908355712890625, 0.02753448486328125, 0.034160614013671875, 0.0407867431640625, 0.047412872314453125, 0.05403900146484375, 0.060665130615234375, 0.067291259765625, 0.07391738891601562, 0.08054351806640625, 0.08716964721679688, 0.0937957763671875, 0.10042190551757812, 0.10704803466796875, 0.11367416381835938, 0.12030029296875, 0.12692642211914062, 0.13355255126953125, 0.14017868041992188, 0.1468048095703125, 0.15343093872070312, 0.16005706787109375, 0.16668319702148438, 0.173309326171875, 0.17993545532226562, 0.18656158447265625, 0.19318771362304688, 0.1998138427734375, 0.20643997192382812, 0.21306610107421875, 0.21969223022460938, 0.226318359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 2.0, 5.0, 6.0, 7.0, 9.0, 11.0, 10.0, 14.0, 24.0, 18.0, 15.0, 32.0, 26.0, 32.0, 36.0, 30.0, 42.0, 40.0, 41.0, 37.0, 39.0, 31.0, 37.0, 25.0, 50.0, 33.0, 37.0, 36.0, 34.0, 39.0, 23.0, 21.0, 18.0, 13.0, 21.0, 22.0, 9.0, 15.0, 9.0, 12.0, 12.0, 4.0, 8.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.171630859375, -0.1664257049560547, -0.16122055053710938, -0.15601539611816406, -0.15081024169921875, -0.14560508728027344, -0.14039993286132812, -0.1351947784423828, -0.1299896240234375, -0.12478446960449219, -0.11957931518554688, -0.11437416076660156, -0.10916900634765625, -0.10396385192871094, -0.09875869750976562, -0.09355354309082031, -0.088348388671875, -0.08314323425292969, -0.07793807983398438, -0.07273292541503906, -0.06752777099609375, -0.06232261657714844, -0.057117462158203125, -0.05191230773925781, -0.0467071533203125, -0.04150199890136719, -0.036296844482421875, -0.031091690063476562, -0.02588653564453125, -0.020681381225585938, -0.015476226806640625, -0.010271072387695312, -0.00506591796875, 0.0001392364501953125, 0.005344390869140625, 0.010549545288085938, 0.01575469970703125, 0.020959854125976562, 0.026165008544921875, 0.03137016296386719, 0.0365753173828125, 0.04178047180175781, 0.046985626220703125, 0.05219078063964844, 0.05739593505859375, 0.06260108947753906, 0.06780624389648438, 0.07301139831542969, 0.078216552734375, 0.08342170715332031, 0.08862686157226562, 0.09383201599121094, 0.09903717041015625, 0.10424232482910156, 0.10944747924804688, 0.11465263366699219, 0.1198577880859375, 0.1250629425048828, 0.13026809692382812, 0.13547325134277344, 0.14067840576171875, 0.14588356018066406, 0.15108871459960938, 0.1562938690185547, 0.1614990234375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 5.0, 11.0, 4.0, 10.0, 13.0, 17.0, 24.0, 22.0, 38.0, 51.0, 57.0, 108.0, 155.0, 189.0, 297.0, 402.0, 579.0, 897.0, 1397.0, 2172.0, 3751.0, 6606.0, 13803.0, 33681.0, 121329.0, 660217.0, 134913.0, 36052.0, 14384.0, 7029.0, 3700.0, 2298.0, 1376.0, 906.0, 603.0, 466.0, 298.0, 212.0, 121.0, 114.0, 62.0, 51.0, 45.0, 29.0, 27.0, 15.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0148773193359375, -0.014373540878295898, -0.013869762420654297, -0.013365983963012695, -0.012862205505371094, -0.012358427047729492, -0.01185464859008789, -0.011350870132446289, -0.010847091674804688, -0.010343313217163086, -0.009839534759521484, -0.009335756301879883, -0.008831977844238281, -0.00832819938659668, -0.007824420928955078, -0.0073206424713134766, -0.006816864013671875, -0.0063130855560302734, -0.005809307098388672, -0.00530552864074707, -0.004801750183105469, -0.004297971725463867, -0.0037941932678222656, -0.003290414810180664, -0.0027866363525390625, -0.002282857894897461, -0.0017790794372558594, -0.0012753009796142578, -0.0007715225219726562, -0.0002677440643310547, 0.00023603439331054688, 0.0007398128509521484, 0.00124359130859375, 0.0017473697662353516, 0.002251148223876953, 0.0027549266815185547, 0.0032587051391601562, 0.003762483596801758, 0.004266262054443359, 0.004770040512084961, 0.0052738189697265625, 0.005777597427368164, 0.006281375885009766, 0.006785154342651367, 0.007288932800292969, 0.00779271125793457, 0.008296489715576172, 0.008800268173217773, 0.009304046630859375, 0.009807825088500977, 0.010311603546142578, 0.01081538200378418, 0.011319160461425781, 0.011822938919067383, 0.012326717376708984, 0.012830495834350586, 0.013334274291992188, 0.013838052749633789, 0.01434183120727539, 0.014845609664916992, 0.015349388122558594, 0.015853166580200195, 0.016356945037841797, 0.0168607234954834, 0.017364501953125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 6.0, 12.0, 32.0, 33.0, 48.0, 49.0, 69.0, 82.0, 94.0, 102.0, 99.0, 147.0, 54.0, 44.0, 37.0, 25.0, 18.0, 8.0, 8.0, 6.0, 6.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.1988525986671448e-06, -2.132728695869446e-06, -2.066604793071747e-06, -2.000480890274048e-06, -1.934356987476349e-06, -1.86823308467865e-06, -1.802109181880951e-06, -1.735985279083252e-06, -1.669861376285553e-06, -1.603737473487854e-06, -1.537613570690155e-06, -1.471489667892456e-06, -1.405365765094757e-06, -1.339241862297058e-06, -1.2731179594993591e-06, -1.2069940567016602e-06, -1.1408701539039612e-06, -1.0747462511062622e-06, -1.0086223483085632e-06, -9.424984455108643e-07, -8.763745427131653e-07, -8.102506399154663e-07, -7.441267371177673e-07, -6.780028343200684e-07, -6.118789315223694e-07, -5.457550287246704e-07, -4.796311259269714e-07, -4.1350722312927246e-07, -3.473833203315735e-07, -2.812594175338745e-07, -2.1513551473617554e-07, -1.4901161193847656e-07, -8.288770914077759e-08, -1.6763806343078613e-08, 4.936009645462036e-08, 1.1548399925231934e-07, 1.816079020500183e-07, 2.477318048477173e-07, 3.1385570764541626e-07, 3.7997961044311523e-07, 4.461035132408142e-07, 5.122274160385132e-07, 5.783513188362122e-07, 6.444752216339111e-07, 7.105991244316101e-07, 7.767230272293091e-07, 8.428469300270081e-07, 9.08970832824707e-07, 9.75094735622406e-07, 1.041218638420105e-06, 1.107342541217804e-06, 1.173466444015503e-06, 1.239590346813202e-06, 1.3057142496109009e-06, 1.3718381524085999e-06, 1.4379620552062988e-06, 1.5040859580039978e-06, 1.5702098608016968e-06, 1.6363337635993958e-06, 1.7024576663970947e-06, 1.7685815691947937e-06, 1.8347054719924927e-06, 1.9008293747901917e-06, 1.9669532775878906e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 15.0, 21.0, 40.0, 50.0, 87.0, 119.0, 157.0, 238.0, 380.0, 580.0, 952.0, 1553.0, 2596.0, 4708.0, 8415.0, 16131.0, 34300.0, 87965.0, 353883.0, 373818.0, 90775.0, 35247.0, 16300.0, 8530.0, 4654.0, 2679.0, 1559.0, 1071.0, 579.0, 388.0, 268.0, 151.0, 112.0, 74.0, 55.0, 32.0, 26.0, 11.0, 9.0, 6.0, 4.0, 6.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01690673828125, -0.016394615173339844, -0.015882492065429688, -0.015370368957519531, -0.014858245849609375, -0.014346122741699219, -0.013833999633789062, -0.013321876525878906, -0.01280975341796875, -0.012297630310058594, -0.011785507202148438, -0.011273384094238281, -0.010761260986328125, -0.010249137878417969, -0.009737014770507812, -0.009224891662597656, -0.0087127685546875, -0.008200645446777344, -0.0076885223388671875, -0.007176399230957031, -0.006664276123046875, -0.006152153015136719, -0.0056400299072265625, -0.005127906799316406, -0.00461578369140625, -0.004103660583496094, -0.0035915374755859375, -0.0030794143676757812, -0.002567291259765625, -0.0020551681518554688, -0.0015430450439453125, -0.0010309219360351562, -0.000518798828125, -6.67572021484375e-06, 0.0005054473876953125, 0.0010175704956054688, 0.001529693603515625, 0.0020418167114257812, 0.0025539398193359375, 0.0030660629272460938, 0.00357818603515625, 0.004090309143066406, 0.0046024322509765625, 0.005114555358886719, 0.005626678466796875, 0.006138801574707031, 0.0066509246826171875, 0.007163047790527344, 0.0076751708984375, 0.008187294006347656, 0.008699417114257812, 0.009211540222167969, 0.009723663330078125, 0.010235786437988281, 0.010747909545898438, 0.011260032653808594, 0.01177215576171875, 0.012284278869628906, 0.012796401977539062, 0.013308525085449219, 0.013820648193359375, 0.014332771301269531, 0.014844894409179688, 0.015357017517089844, 0.015869140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 1.0, 5.0, 3.0, 7.0, 6.0, 5.0, 5.0, 8.0, 8.0, 18.0, 7.0, 13.0, 14.0, 19.0, 33.0, 39.0, 32.0, 50.0, 103.0, 152.0, 127.0, 74.0, 56.0, 44.0, 31.0, 23.0, 13.0, 16.0, 12.0, 14.0, 10.0, 9.0, 8.0, 8.0, 2.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00672149658203125, -0.006522774696350098, -0.006324052810668945, -0.006125330924987793, -0.005926609039306641, -0.005727887153625488, -0.005529165267944336, -0.005330443382263184, -0.005131721496582031, -0.004932999610900879, -0.0047342777252197266, -0.004535555839538574, -0.004336833953857422, -0.0041381120681762695, -0.003939390182495117, -0.003740668296813965, -0.0035419464111328125, -0.00334322452545166, -0.003144502639770508, -0.0029457807540893555, -0.002747058868408203, -0.0025483369827270508, -0.0023496150970458984, -0.002150893211364746, -0.0019521713256835938, -0.0017534494400024414, -0.001554727554321289, -0.0013560056686401367, -0.0011572837829589844, -0.000958561897277832, -0.0007598400115966797, -0.0005611181259155273, -0.000362396240234375, -0.00016367435455322266, 3.504753112792969e-05, 0.00023376941680908203, 0.0004324913024902344, 0.0006312131881713867, 0.0008299350738525391, 0.0010286569595336914, 0.0012273788452148438, 0.001426100730895996, 0.0016248226165771484, 0.0018235445022583008, 0.002022266387939453, 0.0022209882736206055, 0.002419710159301758, 0.00261843204498291, 0.0028171539306640625, 0.003015875816345215, 0.003214597702026367, 0.0034133195877075195, 0.003612041473388672, 0.0038107633590698242, 0.0040094852447509766, 0.004208207130432129, 0.004406929016113281, 0.004605650901794434, 0.004804372787475586, 0.005003094673156738, 0.005201816558837891, 0.005400538444519043, 0.005599260330200195, 0.005797982215881348, 0.0059967041015625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 14.0, 8.0, 13.0, 8.0, 20.0, 23.0, 30.0, 43.0, 33.0, 48.0, 74.0, 81.0, 108.0, 89.0, 74.0, 61.0, 37.0, 40.0, 33.0, 25.0, 31.0, 18.0, 14.0, 10.0, 9.0, 8.0, 10.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3539390563964844, -0.34279918670654297, -0.33165931701660156, -0.32051947712898254, -0.30937960743904114, -0.29823973774909973, -0.2870998978614807, -0.2759600281715393, -0.2648201584815979, -0.2536802887916565, -0.24254043400287628, -0.23140057921409607, -0.22026070952415466, -0.20912083983421326, -0.19798098504543304, -0.18684113025665283, -0.17570126056671143, -0.16456139087677002, -0.1534215360879898, -0.1422816812992096, -0.1311418116092682, -0.12000194936990738, -0.10886208713054657, -0.09772222489118576, -0.08658236265182495, -0.07544250041246414, -0.06430263817310333, -0.05316277593374252, -0.042022913694381714, -0.030883051455020905, -0.019743189215660095, -0.008603326976299286, 0.0025365352630615234, 0.013676397502422333, 0.024816259741783142, 0.03595612198114395, 0.04709598422050476, 0.05823584645986557, 0.06937570869922638, 0.08051557093858719, 0.091655433177948, 0.10279529541730881, 0.11393515765666962, 0.12507501244544983, 0.13621488213539124, 0.14735475182533264, 0.15849460661411285, 0.16963446140289307, 0.18077433109283447, 0.19191420078277588, 0.2030540555715561, 0.2141939103603363, 0.2253337800502777, 0.23647364974021912, 0.24761350452899933, 0.25875335931777954, 0.26989322900772095, 0.28103309869766235, 0.29217296838760376, 0.3033128082752228, 0.3144526779651642, 0.3255925476551056, 0.3367323875427246, 0.347872257232666, 0.3590121269226074]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 9.0, 6.0, 6.0, 13.0, 7.0, 14.0, 17.0, 22.0, 18.0, 14.0, 36.0, 22.0, 30.0, 34.0, 32.0, 39.0, 42.0, 37.0, 52.0, 40.0, 32.0, 56.0, 37.0, 40.0, 41.0, 32.0, 33.0, 35.0, 32.0, 20.0, 21.0, 21.0, 17.0, 12.0, 18.0, 19.0, 11.0, 9.0, 9.0, 3.0, 5.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2623614966869354, -0.25341925024986267, -0.2444770336151123, -0.23553480207920074, -0.22659257054328918, -0.21765032410621643, -0.20870809257030487, -0.1997658610343933, -0.19082362949848175, -0.1818813979625702, -0.17293916642665863, -0.16399693489074707, -0.15505468845367432, -0.14611247181892395, -0.1371702253818512, -0.12822799384593964, -0.11928576231002808, -0.11034353077411652, -0.10140129923820496, -0.0924590602517128, -0.08351682871580124, -0.07457459717988968, -0.06563235819339752, -0.05669012665748596, -0.0477478951215744, -0.03880566358566284, -0.029863428324460983, -0.020921194925904274, -0.011978961527347565, -0.0030367299914360046, 0.005905505269765854, 0.014847740530967712, 0.02379000186920166, 0.03273223340511322, 0.04167446866631508, 0.05061670392751694, 0.0595589354634285, 0.06850116699934006, 0.07744340598583221, 0.08638563752174377, 0.09532786905765533, 0.1042701005935669, 0.11321233212947845, 0.12215457111597061, 0.13109681010246277, 0.14003902673721313, 0.1489812731742859, 0.15792350471019745, 0.166865736246109, 0.17580796778202057, 0.18475019931793213, 0.1936924308538437, 0.20263466238975525, 0.211576908826828, 0.22051914036273956, 0.22946137189865112, 0.23840360343456268, 0.24734583497047424, 0.256288081407547, 0.26523029804229736, 0.2741725444793701, 0.2831147611141205, 0.29205700755119324, 0.3009992241859436, 0.30994147062301636]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 6.0, 12.0, 14.0, 16.0, 29.0, 48.0, 73.0, 96.0, 147.0, 208.0, 322.0, 518.0, 772.0, 1064.0, 1674.0, 2450.0, 3647.0, 5355.0, 8358.0, 12959.0, 20087.0, 32150.0, 54032.0, 95338.0, 190135.0, 275795.0, 145149.0, 77126.0, 44654.0, 26817.0, 17066.0, 10897.0, 7223.0, 4768.0, 3221.0, 2039.0, 1403.0, 966.0, 665.0, 396.0, 284.0, 188.0, 146.0, 89.0, 52.0, 36.0, 22.0, 20.0, 9.0, 7.0, 6.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.49462890625, -0.4793243408203125, -0.464019775390625, -0.4487152099609375, -0.43341064453125, -0.4181060791015625, -0.402801513671875, -0.3874969482421875, -0.3721923828125, -0.3568878173828125, -0.341583251953125, -0.3262786865234375, -0.31097412109375, -0.2956695556640625, -0.280364990234375, -0.2650604248046875, -0.249755859375, -0.2344512939453125, -0.219146728515625, -0.2038421630859375, -0.18853759765625, -0.1732330322265625, -0.157928466796875, -0.1426239013671875, -0.1273193359375, -0.1120147705078125, -0.096710205078125, -0.0814056396484375, -0.06610107421875, -0.0507965087890625, -0.035491943359375, -0.0201873779296875, -0.0048828125, 0.0104217529296875, 0.025726318359375, 0.0410308837890625, 0.05633544921875, 0.0716400146484375, 0.086944580078125, 0.1022491455078125, 0.1175537109375, 0.1328582763671875, 0.148162841796875, 0.1634674072265625, 0.17877197265625, 0.1940765380859375, 0.209381103515625, 0.2246856689453125, 0.239990234375, 0.2552947998046875, 0.270599365234375, 0.2859039306640625, 0.30120849609375, 0.3165130615234375, 0.331817626953125, 0.3471221923828125, 0.3624267578125, 0.3777313232421875, 0.393035888671875, 0.4083404541015625, 0.42364501953125, 0.4389495849609375, 0.454254150390625, 0.4695587158203125, 0.48486328125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 11.0, 6.0, 7.0, 10.0, 9.0, 9.0, 10.0, 18.0, 12.0, 19.0, 20.0, 22.0, 21.0, 24.0, 29.0, 36.0, 33.0, 35.0, 35.0, 45.0, 31.0, 42.0, 46.0, 34.0, 36.0, 37.0, 30.0, 30.0, 36.0, 26.0, 36.0, 25.0, 16.0, 19.0, 18.0, 17.0, 23.0, 15.0, 7.0, 17.0, 12.0, 5.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22021484375, -0.21299362182617188, -0.20577239990234375, -0.19855117797851562, -0.1913299560546875, -0.18410873413085938, -0.17688751220703125, -0.16966629028320312, -0.162445068359375, -0.15522384643554688, -0.14800262451171875, -0.14078140258789062, -0.1335601806640625, -0.12633895874023438, -0.11911773681640625, -0.11189651489257812, -0.10467529296875, -0.09745407104492188, -0.09023284912109375, -0.08301162719726562, -0.0757904052734375, -0.06856918334960938, -0.06134796142578125, -0.054126739501953125, -0.046905517578125, -0.039684295654296875, -0.03246307373046875, -0.025241851806640625, -0.0180206298828125, -0.010799407958984375, -0.00357818603515625, 0.003643035888671875, 0.0108642578125, 0.018085479736328125, 0.02530670166015625, 0.032527923583984375, 0.0397491455078125, 0.046970367431640625, 0.05419158935546875, 0.061412811279296875, 0.068634033203125, 0.07585525512695312, 0.08307647705078125, 0.09029769897460938, 0.0975189208984375, 0.10474014282226562, 0.11196136474609375, 0.11918258666992188, 0.12640380859375, 0.13362503051757812, 0.14084625244140625, 0.14806747436523438, 0.1552886962890625, 0.16250991821289062, 0.16973114013671875, 0.17695236206054688, 0.184173583984375, 0.19139480590820312, 0.19861602783203125, 0.20583724975585938, 0.2130584716796875, 0.22027969360351562, 0.22750091552734375, 0.23472213745117188, 0.241943359375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 20.0, 23.0, 30.0, 38.0, 37.0, 91.0, 101.0, 183.0, 232.0, 376.0, 519.0, 730.0, 1165.0, 1743.0, 2629.0, 3696.0, 5742.0, 8530.0, 13225.0, 20443.0, 31955.0, 51677.0, 87435.0, 163343.0, 273720.0, 156905.0, 84220.0, 50319.0, 31147.0, 19839.0, 12934.0, 8542.0, 5632.0, 3672.0, 2511.0, 1628.0, 1131.0, 714.0, 512.0, 385.0, 252.0, 162.0, 120.0, 71.0, 52.0, 38.0, 25.0, 16.0, 23.0, 7.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.45751953125, -0.4425048828125, -0.427490234375, -0.4124755859375, -0.3974609375, -0.3824462890625, -0.367431640625, -0.3524169921875, -0.33740234375, -0.3223876953125, -0.307373046875, -0.2923583984375, -0.27734375, -0.2623291015625, -0.247314453125, -0.2322998046875, -0.21728515625, -0.2022705078125, -0.187255859375, -0.1722412109375, -0.1572265625, -0.1422119140625, -0.127197265625, -0.1121826171875, -0.09716796875, -0.0821533203125, -0.067138671875, -0.0521240234375, -0.037109375, -0.0220947265625, -0.007080078125, 0.0079345703125, 0.02294921875, 0.0379638671875, 0.052978515625, 0.0679931640625, 0.0830078125, 0.0980224609375, 0.113037109375, 0.1280517578125, 0.14306640625, 0.1580810546875, 0.173095703125, 0.1881103515625, 0.203125, 0.2181396484375, 0.233154296875, 0.2481689453125, 0.26318359375, 0.2781982421875, 0.293212890625, 0.3082275390625, 0.3232421875, 0.3382568359375, 0.353271484375, 0.3682861328125, 0.38330078125, 0.3983154296875, 0.413330078125, 0.4283447265625, 0.443359375, 0.4583740234375, 0.473388671875, 0.4884033203125, 0.50341796875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 7.0, 8.0, 6.0, 4.0, 5.0, 7.0, 6.0, 8.0, 10.0, 12.0, 18.0, 25.0, 23.0, 22.0, 25.0, 22.0, 26.0, 37.0, 28.0, 35.0, 43.0, 49.0, 39.0, 33.0, 48.0, 32.0, 31.0, 27.0, 46.0, 33.0, 31.0, 28.0, 32.0, 16.0, 22.0, 24.0, 23.0, 17.0, 20.0, 13.0, 15.0, 11.0, 8.0, 10.0, 3.0, 2.0, 4.0, 7.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.154296875, -0.1495380401611328, -0.14477920532226562, -0.14002037048339844, -0.13526153564453125, -0.13050270080566406, -0.12574386596679688, -0.12098503112792969, -0.1162261962890625, -0.11146736145019531, -0.10670852661132812, -0.10194969177246094, -0.09719085693359375, -0.09243202209472656, -0.08767318725585938, -0.08291435241699219, -0.078155517578125, -0.07339668273925781, -0.06863784790039062, -0.06387901306152344, -0.05912017822265625, -0.05436134338378906, -0.049602508544921875, -0.04484367370605469, -0.0400848388671875, -0.03532600402832031, -0.030567169189453125, -0.025808334350585938, -0.02104949951171875, -0.016290664672851562, -0.011531829833984375, -0.0067729949951171875, -0.00201416015625, 0.0027446746826171875, 0.007503509521484375, 0.012262344360351562, 0.01702117919921875, 0.021780014038085938, 0.026538848876953125, 0.03129768371582031, 0.0360565185546875, 0.04081535339355469, 0.045574188232421875, 0.05033302307128906, 0.05509185791015625, 0.05985069274902344, 0.06460952758789062, 0.06936836242675781, 0.074127197265625, 0.07888603210449219, 0.08364486694335938, 0.08840370178222656, 0.09316253662109375, 0.09792137145996094, 0.10268020629882812, 0.10743904113769531, 0.1121978759765625, 0.11695671081542969, 0.12171554565429688, 0.12647438049316406, 0.13123321533203125, 0.13599205017089844, 0.14075088500976562, 0.1455097198486328, 0.1502685546875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 8.0, 8.0, 17.0, 29.0, 29.0, 54.0, 50.0, 68.0, 99.0, 164.0, 234.0, 280.0, 357.0, 489.0, 629.0, 856.0, 1196.0, 1633.0, 2255.0, 3149.0, 4800.0, 7750.0, 13336.0, 29426.0, 117952.0, 763820.0, 51132.0, 18934.0, 10007.0, 5952.0, 3967.0, 2685.0, 1853.0, 1368.0, 999.0, 788.0, 562.0, 405.0, 312.0, 248.0, 156.0, 118.0, 99.0, 78.0, 63.0, 44.0, 20.0, 20.0, 22.0, 7.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0], "bins": [-0.1097412109375, -0.10644054412841797, -0.10313987731933594, -0.0998392105102539, -0.09653854370117188, -0.09323787689208984, -0.08993721008300781, -0.08663654327392578, -0.08333587646484375, -0.08003520965576172, -0.07673454284667969, -0.07343387603759766, -0.07013320922851562, -0.0668325424194336, -0.06353187561035156, -0.06023120880126953, -0.0569305419921875, -0.05362987518310547, -0.05032920837402344, -0.047028541564941406, -0.043727874755859375, -0.040427207946777344, -0.03712654113769531, -0.03382587432861328, -0.03052520751953125, -0.02722454071044922, -0.023923873901367188, -0.020623207092285156, -0.017322540283203125, -0.014021873474121094, -0.010721206665039062, -0.007420539855957031, -0.004119873046875, -0.0008192062377929688, 0.0024814605712890625, 0.005782127380371094, 0.009082794189453125, 0.012383460998535156, 0.015684127807617188, 0.01898479461669922, 0.02228546142578125, 0.02558612823486328, 0.028886795043945312, 0.032187461853027344, 0.035488128662109375, 0.038788795471191406, 0.04208946228027344, 0.04539012908935547, 0.0486907958984375, 0.05199146270751953, 0.05529212951660156, 0.058592796325683594, 0.061893463134765625, 0.06519412994384766, 0.06849479675292969, 0.07179546356201172, 0.07509613037109375, 0.07839679718017578, 0.08169746398925781, 0.08499813079833984, 0.08829879760742188, 0.0915994644165039, 0.09490013122558594, 0.09820079803466797, 0.10150146484375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 11.0, 4.0, 12.0, 19.0, 28.0, 38.0, 66.0, 265.0, 224.0, 165.0, 35.0, 37.0, 14.0, 19.0, 10.0, 10.0, 7.0, 2.0, 3.0, 2.0, 9.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.993511199951172e-06, -3.841705620288849e-06, -3.689900040626526e-06, -3.538094460964203e-06, -3.38628888130188e-06, -3.234483301639557e-06, -3.082677721977234e-06, -2.930872142314911e-06, -2.779066562652588e-06, -2.627260982990265e-06, -2.475455403327942e-06, -2.323649823665619e-06, -2.171844244003296e-06, -2.020038664340973e-06, -1.86823308467865e-06, -1.716427505016327e-06, -1.564621925354004e-06, -1.412816345691681e-06, -1.261010766029358e-06, -1.109205186367035e-06, -9.57399606704712e-07, -8.055940270423889e-07, -6.537884473800659e-07, -5.019828677177429e-07, -3.501772880554199e-07, -1.9837170839309692e-07, -4.6566128730773926e-08, 1.0523945093154907e-07, 2.5704503059387207e-07, 4.0885061025619507e-07, 5.606561899185181e-07, 7.124617695808411e-07, 8.642673492431641e-07, 1.016072928905487e-06, 1.16787850856781e-06, 1.319684088230133e-06, 1.471489667892456e-06, 1.623295247554779e-06, 1.775100827217102e-06, 1.926906406879425e-06, 2.078711986541748e-06, 2.230517566204071e-06, 2.382323145866394e-06, 2.534128725528717e-06, 2.68593430519104e-06, 2.837739884853363e-06, 2.989545464515686e-06, 3.141351044178009e-06, 3.293156623840332e-06, 3.444962203502655e-06, 3.596767783164978e-06, 3.748573362827301e-06, 3.900378942489624e-06, 4.052184522151947e-06, 4.20399010181427e-06, 4.355795681476593e-06, 4.507601261138916e-06, 4.659406840801239e-06, 4.811212420463562e-06, 4.963018000125885e-06, 5.114823579788208e-06, 5.266629159450531e-06, 5.418434739112854e-06, 5.570240318775177e-06, 5.7220458984375e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 10.0, 11.0, 8.0, 11.0, 16.0, 27.0, 36.0, 60.0, 83.0, 78.0, 142.0, 182.0, 208.0, 343.0, 435.0, 567.0, 784.0, 982.0, 1438.0, 1871.0, 2700.0, 3994.0, 6550.0, 12208.0, 35516.0, 815017.0, 116875.0, 21331.0, 9291.0, 5463.0, 3546.0, 2330.0, 1683.0, 1245.0, 909.0, 676.0, 511.0, 370.0, 275.0, 192.0, 154.0, 114.0, 85.0, 63.0, 48.0, 35.0, 21.0, 24.0, 14.0, 9.0, 7.0, 3.0, 5.0, 4.0, 0.0, 5.0], "bins": [-0.1854248046875, -0.17993927001953125, -0.1744537353515625, -0.16896820068359375, -0.163482666015625, -0.15799713134765625, -0.1525115966796875, -0.14702606201171875, -0.14154052734375, -0.13605499267578125, -0.1305694580078125, -0.12508392333984375, -0.119598388671875, -0.11411285400390625, -0.1086273193359375, -0.10314178466796875, -0.09765625, -0.09217071533203125, -0.0866851806640625, -0.08119964599609375, -0.075714111328125, -0.07022857666015625, -0.0647430419921875, -0.05925750732421875, -0.05377197265625, -0.04828643798828125, -0.0428009033203125, -0.03731536865234375, -0.031829833984375, -0.02634429931640625, -0.0208587646484375, -0.01537322998046875, -0.0098876953125, -0.00440216064453125, 0.0010833740234375, 0.00656890869140625, 0.012054443359375, 0.01753997802734375, 0.0230255126953125, 0.02851104736328125, 0.03399658203125, 0.03948211669921875, 0.0449676513671875, 0.05045318603515625, 0.055938720703125, 0.06142425537109375, 0.0669097900390625, 0.07239532470703125, 0.077880859375, 0.08336639404296875, 0.0888519287109375, 0.09433746337890625, 0.099822998046875, 0.10530853271484375, 0.1107940673828125, 0.11627960205078125, 0.12176513671875, 0.12725067138671875, 0.1327362060546875, 0.13822174072265625, 0.143707275390625, 0.14919281005859375, 0.1546783447265625, 0.16016387939453125, 0.1656494140625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 9.0, 31.0, 58.0, 144.0, 559.0, 64.0, 25.0, 15.0, 15.0, 8.0, 7.0, 4.0, 4.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054229736328125, -0.05243396759033203, -0.05063819885253906, -0.048842430114746094, -0.047046661376953125, -0.045250892639160156, -0.04345512390136719, -0.04165935516357422, -0.03986358642578125, -0.03806781768798828, -0.03627204895019531, -0.034476280212402344, -0.032680511474609375, -0.030884742736816406, -0.029088973999023438, -0.02729320526123047, -0.0254974365234375, -0.02370166778564453, -0.021905899047851562, -0.020110130310058594, -0.018314361572265625, -0.016518592834472656, -0.014722824096679688, -0.012927055358886719, -0.01113128662109375, -0.009335517883300781, -0.0075397491455078125, -0.005743980407714844, -0.003948211669921875, -0.0021524429321289062, -0.0003566741943359375, 0.0014390945434570312, 0.00323486328125, 0.005030632019042969, 0.0068264007568359375, 0.008622169494628906, 0.010417938232421875, 0.012213706970214844, 0.014009475708007812, 0.01580524444580078, 0.01760101318359375, 0.01939678192138672, 0.021192550659179688, 0.022988319396972656, 0.024784088134765625, 0.026579856872558594, 0.028375625610351562, 0.03017139434814453, 0.0319671630859375, 0.03376293182373047, 0.03555870056152344, 0.037354469299316406, 0.039150238037109375, 0.040946006774902344, 0.04274177551269531, 0.04453754425048828, 0.04633331298828125, 0.04812908172607422, 0.04992485046386719, 0.051720619201660156, 0.053516387939453125, 0.055312156677246094, 0.05710792541503906, 0.05890369415283203, 0.060699462890625]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 5.0, 7.0, 5.0, 10.0, 14.0, 13.0, 26.0, 27.0, 28.0, 35.0, 39.0, 41.0, 66.0, 84.0, 84.0, 93.0, 79.0, 73.0, 42.0, 42.0, 34.0, 22.0, 22.0, 17.0, 8.0, 8.0, 7.0, 7.0, 12.0, 2.0, 5.0, 8.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.34180545806884766, -0.33202922344207764, -0.32225295901298523, -0.3124767243862152, -0.3027004897594452, -0.2929242253303528, -0.28314799070358276, -0.27337175607681274, -0.2635955214500427, -0.2538192868232727, -0.2440430372953415, -0.23426678776741028, -0.22449055314064026, -0.21471430361270905, -0.20493805408477783, -0.1951618194580078, -0.1853855550289154, -0.1756093055009842, -0.16583307087421417, -0.15605682134628296, -0.14628058671951294, -0.13650433719158173, -0.1267280876636505, -0.1169518455862999, -0.10717560350894928, -0.09739936143159866, -0.08762311935424805, -0.07784686982631683, -0.06807062774896622, -0.0582943856716156, -0.048518139868974686, -0.03874189406633377, -0.028965622186660767, -0.019189378246665, -0.009413134306669235, 0.00036310963332653046, 0.010139353573322296, 0.019915595650672913, 0.029691841453313828, 0.03946808725595474, 0.04924432933330536, 0.059020571410655975, 0.06879681348800659, 0.0785730630159378, 0.08834930509328842, 0.09812554717063904, 0.10790179669857025, 0.11767803877592087, 0.12745428085327148, 0.1372305303812027, 0.14700676500797272, 0.15678301453590393, 0.16655924916267395, 0.17633549869060516, 0.18611174821853638, 0.1958879828453064, 0.2056642323732376, 0.21544048190116882, 0.22521671652793884, 0.23499296605587006, 0.24476921558380127, 0.2545454502105713, 0.2643216848373413, 0.2740979492664337, 0.28387418389320374]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 7.0, 10.0, 13.0, 10.0, 13.0, 15.0, 19.0, 24.0, 26.0, 26.0, 26.0, 31.0, 36.0, 35.0, 28.0, 44.0, 44.0, 47.0, 37.0, 43.0, 42.0, 40.0, 31.0, 48.0, 24.0, 33.0, 28.0, 28.0, 27.0, 26.0, 22.0, 14.0, 20.0, 10.0, 11.0, 11.0, 9.0, 7.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.262365460395813, -0.25388073921203613, -0.24539600312709808, -0.23691128194332123, -0.22842654585838318, -0.21994182467460632, -0.21145710349082947, -0.2029723823070526, -0.19448764622211456, -0.1860029250383377, -0.17751818895339966, -0.1690334677696228, -0.16054874658584595, -0.1520640105009079, -0.14357928931713104, -0.135094553232193, -0.12660983204841614, -0.11812510341405869, -0.10964037477970123, -0.10115565359592438, -0.09267092496156693, -0.08418619632720947, -0.07570147514343262, -0.06721674650907516, -0.05873201787471771, -0.05024728924036026, -0.041762564331293106, -0.03327783942222595, -0.0247931107878685, -0.016308382153511047, -0.007823657244443893, 0.0006610676646232605, 0.009145796298980713, 0.017630523070693016, 0.02611524984240532, 0.03459997475147247, 0.043084703385829926, 0.05156943202018738, 0.06005415692925453, 0.06853888183832169, 0.07702361047267914, 0.08550833910703659, 0.09399306774139404, 0.1024777889251709, 0.11096251755952835, 0.1194472461938858, 0.12793196737766266, 0.1364167034626007, 0.14490142464637756, 0.15338614583015442, 0.16187088191509247, 0.17035560309886932, 0.17884033918380737, 0.18732506036758423, 0.19580978155136108, 0.20429450273513794, 0.212779238820076, 0.22126396000385284, 0.2297486960887909, 0.23823341727256775, 0.2467181384563446, 0.25520288944244385, 0.2636876106262207, 0.27217233180999756, 0.2806570529937744]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 2.0, 6.0, 6.0, 13.0, 12.0, 22.0, 40.0, 43.0, 71.0, 101.0, 175.0, 264.0, 474.0, 756.0, 1315.0, 2136.0, 3660.0, 5940.0, 9913.0, 16393.0, 28069.0, 49576.0, 95297.0, 203903.0, 616680.0, 1934099.0, 764285.0, 229373.0, 104616.0, 53483.0, 30067.0, 17479.0, 10431.0, 5993.0, 3678.0, 2288.0, 1405.0, 827.0, 540.0, 307.0, 186.0, 115.0, 78.0, 49.0, 36.0, 28.0, 19.0, 13.0, 10.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.421142578125, -0.40895843505859375, -0.3967742919921875, -0.38459014892578125, -0.372406005859375, -0.36022186279296875, -0.3480377197265625, -0.33585357666015625, -0.32366943359375, -0.31148529052734375, -0.2993011474609375, -0.28711700439453125, -0.274932861328125, -0.26274871826171875, -0.2505645751953125, -0.23838043212890625, -0.2261962890625, -0.21401214599609375, -0.2018280029296875, -0.18964385986328125, -0.177459716796875, -0.16527557373046875, -0.1530914306640625, -0.14090728759765625, -0.12872314453125, -0.11653900146484375, -0.1043548583984375, -0.09217071533203125, -0.079986572265625, -0.06780242919921875, -0.0556182861328125, -0.04343414306640625, -0.03125, -0.01906585693359375, -0.0068817138671875, 0.00530242919921875, 0.017486572265625, 0.02967071533203125, 0.0418548583984375, 0.05403900146484375, 0.06622314453125, 0.07840728759765625, 0.0905914306640625, 0.10277557373046875, 0.114959716796875, 0.12714385986328125, 0.1393280029296875, 0.15151214599609375, 0.1636962890625, 0.17588043212890625, 0.1880645751953125, 0.20024871826171875, 0.212432861328125, 0.22461700439453125, 0.2368011474609375, 0.24898529052734375, 0.26116943359375, 0.27335357666015625, 0.2855377197265625, 0.29772186279296875, 0.309906005859375, 0.32209014892578125, 0.3342742919921875, 0.34645843505859375, 0.358642578125]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 11.0, 6.0, 15.0, 16.0, 4.0, 12.0, 26.0, 19.0, 20.0, 25.0, 25.0, 28.0, 40.0, 36.0, 35.0, 42.0, 41.0, 40.0, 47.0, 42.0, 50.0, 54.0, 37.0, 41.0, 39.0, 39.0, 29.0, 19.0, 23.0, 21.0, 20.0, 15.0, 10.0, 12.0, 17.0, 14.0, 7.0, 4.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1767578125, -0.1713714599609375, -0.165985107421875, -0.1605987548828125, -0.15521240234375, -0.1498260498046875, -0.144439697265625, -0.1390533447265625, -0.1336669921875, -0.1282806396484375, -0.122894287109375, -0.1175079345703125, -0.11212158203125, -0.1067352294921875, -0.101348876953125, -0.0959625244140625, -0.090576171875, -0.0851898193359375, -0.079803466796875, -0.0744171142578125, -0.06903076171875, -0.0636444091796875, -0.058258056640625, -0.0528717041015625, -0.0474853515625, -0.0420989990234375, -0.036712646484375, -0.0313262939453125, -0.02593994140625, -0.0205535888671875, -0.015167236328125, -0.0097808837890625, -0.00439453125, 0.0009918212890625, 0.006378173828125, 0.0117645263671875, 0.01715087890625, 0.0225372314453125, 0.027923583984375, 0.0333099365234375, 0.0386962890625, 0.0440826416015625, 0.049468994140625, 0.0548553466796875, 0.06024169921875, 0.0656280517578125, 0.071014404296875, 0.0764007568359375, 0.081787109375, 0.0871734619140625, 0.092559814453125, 0.0979461669921875, 0.10333251953125, 0.1087188720703125, 0.114105224609375, 0.1194915771484375, 0.1248779296875, 0.1302642822265625, 0.135650634765625, 0.1410369873046875, 0.14642333984375, 0.1518096923828125, 0.157196044921875, 0.1625823974609375, 0.16796875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 14.0, 9.0, 22.0, 22.0, 34.0, 43.0, 69.0, 95.0, 188.0, 228.0, 336.0, 541.0, 775.0, 1289.0, 2082.0, 3364.0, 5773.0, 9517.0, 16497.0, 28818.0, 51177.0, 94904.0, 184968.0, 395525.0, 1098049.0, 1375523.0, 469569.0, 212223.0, 107646.0, 57372.0, 32037.0, 18264.0, 10877.0, 6309.0, 3703.0, 2231.0, 1415.0, 953.0, 608.0, 403.0, 262.0, 177.0, 122.0, 74.0, 50.0, 50.0, 19.0, 30.0, 9.0, 8.0, 7.0, 0.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.305419921875, -0.2961921691894531, -0.28696441650390625, -0.2777366638183594, -0.2685089111328125, -0.2592811584472656, -0.25005340576171875, -0.24082565307617188, -0.231597900390625, -0.22237014770507812, -0.21314239501953125, -0.20391464233398438, -0.1946868896484375, -0.18545913696289062, -0.17623138427734375, -0.16700363159179688, -0.15777587890625, -0.14854812622070312, -0.13932037353515625, -0.13009262084960938, -0.1208648681640625, -0.11163711547851562, -0.10240936279296875, -0.09318161010742188, -0.083953857421875, -0.07472610473632812, -0.06549835205078125, -0.056270599365234375, -0.0470428466796875, -0.037815093994140625, -0.02858734130859375, -0.019359588623046875, -0.0101318359375, -0.000904083251953125, 0.00832366943359375, 0.017551422119140625, 0.0267791748046875, 0.036006927490234375, 0.04523468017578125, 0.054462432861328125, 0.063690185546875, 0.07291793823242188, 0.08214569091796875, 0.09137344360351562, 0.1006011962890625, 0.10982894897460938, 0.11905670166015625, 0.12828445434570312, 0.13751220703125, 0.14673995971679688, 0.15596771240234375, 0.16519546508789062, 0.1744232177734375, 0.18365097045898438, 0.19287872314453125, 0.20210647583007812, 0.211334228515625, 0.22056198120117188, 0.22978973388671875, 0.23901748657226562, 0.2482452392578125, 0.2574729919433594, 0.26670074462890625, 0.2759284973144531, 0.28515625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 10.0, 17.0, 23.0, 18.0, 31.0, 39.0, 36.0, 36.0, 48.0, 92.0, 79.0, 81.0, 97.0, 140.0, 157.0, 192.0, 208.0, 251.0, 232.0, 310.0, 288.0, 249.0, 216.0, 170.0, 174.0, 144.0, 124.0, 114.0, 95.0, 88.0, 51.0, 65.0, 29.0, 38.0, 30.0, 26.0, 19.0, 20.0, 3.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.09112548828125, -0.0884389877319336, -0.08575248718261719, -0.08306598663330078, -0.08037948608398438, -0.07769298553466797, -0.07500648498535156, -0.07231998443603516, -0.06963348388671875, -0.06694698333740234, -0.06426048278808594, -0.06157398223876953, -0.058887481689453125, -0.05620098114013672, -0.05351448059082031, -0.050827980041503906, -0.0481414794921875, -0.045454978942871094, -0.04276847839355469, -0.04008197784423828, -0.037395477294921875, -0.03470897674560547, -0.03202247619628906, -0.029335975646972656, -0.02664947509765625, -0.023962974548339844, -0.021276473999023438, -0.01858997344970703, -0.015903472900390625, -0.013216972351074219, -0.010530471801757812, -0.007843971252441406, -0.005157470703125, -0.0024709701538085938, 0.0002155303955078125, 0.0029020309448242188, 0.005588531494140625, 0.008275032043457031, 0.010961532592773438, 0.013648033142089844, 0.01633453369140625, 0.019021034240722656, 0.021707534790039062, 0.02439403533935547, 0.027080535888671875, 0.02976703643798828, 0.03245353698730469, 0.035140037536621094, 0.0378265380859375, 0.040513038635253906, 0.04319953918457031, 0.04588603973388672, 0.048572540283203125, 0.05125904083251953, 0.05394554138183594, 0.056632041931152344, 0.05931854248046875, 0.062005043029785156, 0.06469154357910156, 0.06737804412841797, 0.07006454467773438, 0.07275104522705078, 0.07543754577636719, 0.0781240463256836, 0.080810546875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 4.0, 5.0, 7.0, 11.0, 10.0, 17.0, 20.0, 26.0, 34.0, 40.0, 33.0, 58.0, 92.0, 87.0, 120.0, 86.0, 67.0, 56.0, 47.0, 37.0, 33.0, 22.0, 22.0, 15.0, 7.0, 15.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26629164814949036, -0.2583143413066864, -0.25033700466156006, -0.2423596978187561, -0.23438237607479095, -0.2264050543308258, -0.21842774748802185, -0.2104504257440567, -0.20247310400009155, -0.1944957822561264, -0.18651847541332245, -0.1785411536693573, -0.17056383192539215, -0.162586510181427, -0.15460920333862305, -0.1466318815946579, -0.13865457475185394, -0.1306772530078888, -0.12269993871450424, -0.11472262442111969, -0.10674530267715454, -0.09876798838376999, -0.09079067409038544, -0.08281335234642029, -0.07483603805303574, -0.06685872375965118, -0.058881402015686035, -0.05090408772230148, -0.04292676970362663, -0.03494945168495178, -0.02697213739156723, -0.01899481937289238, -0.011017486453056335, -0.0030401693657040596, 0.004937147721648216, 0.012914463877677917, 0.020891781896352768, 0.02886909991502762, 0.03684641420841217, 0.04482373222708702, 0.05280105024576187, 0.06077836826443672, 0.06875568628311157, 0.07673300057649612, 0.08471031486988068, 0.09268763661384583, 0.10066495090723038, 0.10864226520061493, 0.11661958694458008, 0.12459690123796463, 0.13257421553134918, 0.14055153727531433, 0.14852885901927948, 0.15650618076324463, 0.16448348760604858, 0.17246080935001373, 0.18043813109397888, 0.18841545283794403, 0.19639275968074799, 0.20437008142471313, 0.21234740316867828, 0.22032472491264343, 0.2283020317554474, 0.23627935349941254, 0.2442566603422165]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 8.0, 8.0, 9.0, 9.0, 12.0, 14.0, 21.0, 28.0, 28.0, 31.0, 27.0, 31.0, 27.0, 36.0, 29.0, 42.0, 39.0, 37.0, 43.0, 39.0, 47.0, 39.0, 34.0, 35.0, 40.0, 36.0, 28.0, 21.0, 32.0, 20.0, 25.0, 15.0, 22.0, 11.0, 17.0, 18.0, 13.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.19953183829784393, -0.19381652772426605, -0.18810123205184937, -0.18238592147827148, -0.1766706109046936, -0.17095531523227692, -0.16524000465869904, -0.15952470898628235, -0.15380939841270447, -0.1480940878391266, -0.1423787921667099, -0.13666348159313202, -0.13094818592071533, -0.12523287534713745, -0.11951756477355957, -0.11380226165056229, -0.108086958527565, -0.10237165540456772, -0.09665635228157043, -0.09094104170799255, -0.08522573858499527, -0.07951043546199799, -0.0737951248884201, -0.06807982176542282, -0.06236451864242554, -0.05664921551942825, -0.05093390867114067, -0.04521860182285309, -0.039503298699855804, -0.03378799557685852, -0.028072688728570938, -0.022357381880283356, -0.016642078757286072, -0.010926773771643639, -0.0052114687860012054, 0.0005038361996412277, 0.006219141185283661, 0.011934446170926094, 0.017649751156568527, 0.02336505800485611, 0.029080361127853394, 0.03479566425085068, 0.04051097109913826, 0.04622627794742584, 0.051941581070423126, 0.05765688419342041, 0.06337219476699829, 0.06908749788999557, 0.07480280101299286, 0.08051810413599014, 0.08623340725898743, 0.09194871783256531, 0.09766402095556259, 0.10337932407855988, 0.10909463465213776, 0.11480993777513504, 0.12052524089813232, 0.1262405514717102, 0.1319558471441269, 0.13767115771770477, 0.14338645339012146, 0.14910176396369934, 0.15481707453727722, 0.1605323851108551, 0.1662476807832718]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 8.0, 4.0, 7.0, 11.0, 20.0, 35.0, 41.0, 57.0, 114.0, 163.0, 298.0, 421.0, 705.0, 1233.0, 2031.0, 3332.0, 5377.0, 8742.0, 14992.0, 26901.0, 51024.0, 110206.0, 269535.0, 303186.0, 123878.0, 56532.0, 29291.0, 16128.0, 9555.0, 5738.0, 3537.0, 2104.0, 1341.0, 751.0, 480.0, 289.0, 157.0, 116.0, 82.0, 44.0, 19.0, 25.0, 11.0, 8.0, 10.0, 7.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1126708984375, -0.10915756225585938, -0.10564422607421875, -0.10213088989257812, -0.0986175537109375, -0.09510421752929688, -0.09159088134765625, -0.08807754516601562, -0.084564208984375, -0.08105087280273438, -0.07753753662109375, -0.07402420043945312, -0.0705108642578125, -0.06699752807617188, -0.06348419189453125, -0.059970855712890625, -0.05645751953125, -0.052944183349609375, -0.04943084716796875, -0.045917510986328125, -0.0424041748046875, -0.038890838623046875, -0.03537750244140625, -0.031864166259765625, -0.028350830078125, -0.024837493896484375, -0.02132415771484375, -0.017810821533203125, -0.0142974853515625, -0.010784149169921875, -0.00727081298828125, -0.003757476806640625, -0.000244140625, 0.003269195556640625, 0.00678253173828125, 0.010295867919921875, 0.0138092041015625, 0.017322540283203125, 0.02083587646484375, 0.024349212646484375, 0.027862548828125, 0.031375885009765625, 0.03488922119140625, 0.038402557373046875, 0.0419158935546875, 0.045429229736328125, 0.04894256591796875, 0.052455902099609375, 0.05596923828125, 0.059482574462890625, 0.06299591064453125, 0.06650924682617188, 0.0700225830078125, 0.07353591918945312, 0.07704925537109375, 0.08056259155273438, 0.084075927734375, 0.08758926391601562, 0.09110260009765625, 0.09461593627929688, 0.0981292724609375, 0.10164260864257812, 0.10515594482421875, 0.10866928100585938, 0.1121826171875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 10.0, 6.0, 15.0, 13.0, 21.0, 17.0, 30.0, 24.0, 21.0, 28.0, 30.0, 46.0, 26.0, 35.0, 32.0, 38.0, 33.0, 41.0, 34.0, 44.0, 41.0, 32.0, 39.0, 38.0, 33.0, 32.0, 24.0, 26.0, 20.0, 18.0, 16.0, 23.0, 8.0, 13.0, 17.0, 15.0, 17.0, 11.0, 7.0, 6.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.1951904296875, -0.18968582153320312, -0.18418121337890625, -0.17867660522460938, -0.1731719970703125, -0.16766738891601562, -0.16216278076171875, -0.15665817260742188, -0.151153564453125, -0.14564895629882812, -0.14014434814453125, -0.13463973999023438, -0.1291351318359375, -0.12363052368164062, -0.11812591552734375, -0.11262130737304688, -0.10711669921875, -0.10161209106445312, -0.09610748291015625, -0.09060287475585938, -0.0850982666015625, -0.07959365844726562, -0.07408905029296875, -0.06858444213867188, -0.063079833984375, -0.057575225830078125, -0.05207061767578125, -0.046566009521484375, -0.0410614013671875, -0.035556793212890625, -0.03005218505859375, -0.024547576904296875, -0.01904296875, -0.013538360595703125, -0.00803375244140625, -0.002529144287109375, 0.0029754638671875, 0.008480072021484375, 0.01398468017578125, 0.019489288330078125, 0.024993896484375, 0.030498504638671875, 0.03600311279296875, 0.041507720947265625, 0.0470123291015625, 0.052516937255859375, 0.05802154541015625, 0.06352615356445312, 0.06903076171875, 0.07453536987304688, 0.08003997802734375, 0.08554458618164062, 0.0910491943359375, 0.09655380249023438, 0.10205841064453125, 0.10756301879882812, 0.113067626953125, 0.11857223510742188, 0.12407684326171875, 0.12958145141601562, 0.1350860595703125, 0.14059066772460938, 0.14609527587890625, 0.15159988403320312, 0.1571044921875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 12.0, 15.0, 23.0, 20.0, 22.0, 50.0, 62.0, 101.0, 156.0, 184.0, 267.0, 403.0, 545.0, 763.0, 1024.0, 1403.0, 2086.0, 3070.0, 4689.0, 7545.0, 13745.0, 28788.0, 76649.0, 307870.0, 426623.0, 97299.0, 34579.0, 15760.0, 8525.0, 5134.0, 3447.0, 2270.0, 1574.0, 1105.0, 795.0, 556.0, 417.0, 326.0, 180.0, 124.0, 90.0, 84.0, 53.0, 27.0, 33.0, 16.0, 18.0, 10.0, 9.0, 7.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.169189453125, -0.1642284393310547, -0.15926742553710938, -0.15430641174316406, -0.14934539794921875, -0.14438438415527344, -0.13942337036132812, -0.1344623565673828, -0.1295013427734375, -0.12454032897949219, -0.11957931518554688, -0.11461830139160156, -0.10965728759765625, -0.10469627380371094, -0.09973526000976562, -0.09477424621582031, -0.089813232421875, -0.08485221862792969, -0.07989120483398438, -0.07493019104003906, -0.06996917724609375, -0.06500816345214844, -0.060047149658203125, -0.05508613586425781, -0.0501251220703125, -0.04516410827636719, -0.040203094482421875, -0.03524208068847656, -0.03028106689453125, -0.025320053100585938, -0.020359039306640625, -0.015398025512695312, -0.01043701171875, -0.0054759979248046875, -0.000514984130859375, 0.0044460296630859375, 0.00940704345703125, 0.014368057250976562, 0.019329071044921875, 0.024290084838867188, 0.0292510986328125, 0.03421211242675781, 0.039173126220703125, 0.04413414001464844, 0.04909515380859375, 0.05405616760253906, 0.059017181396484375, 0.06397819519042969, 0.068939208984375, 0.07390022277832031, 0.07886123657226562, 0.08382225036621094, 0.08878326416015625, 0.09374427795410156, 0.09870529174804688, 0.10366630554199219, 0.1086273193359375, 0.11358833312988281, 0.11854934692382812, 0.12351036071777344, 0.12847137451171875, 0.13343238830566406, 0.13839340209960938, 0.1433544158935547, 0.1483154296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 8.0, 2.0, 7.0, 9.0, 9.0, 11.0, 10.0, 11.0, 22.0, 21.0, 15.0, 22.0, 31.0, 19.0, 22.0, 40.0, 38.0, 32.0, 39.0, 39.0, 37.0, 38.0, 48.0, 43.0, 38.0, 43.0, 38.0, 40.0, 34.0, 28.0, 27.0, 29.0, 20.0, 16.0, 21.0, 18.0, 18.0, 15.0, 8.0, 5.0, 10.0, 5.0, 3.0, 6.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.124755859375, -0.12107086181640625, -0.1173858642578125, -0.11370086669921875, -0.110015869140625, -0.10633087158203125, -0.1026458740234375, -0.09896087646484375, -0.09527587890625, -0.09159088134765625, -0.0879058837890625, -0.08422088623046875, -0.080535888671875, -0.07685089111328125, -0.0731658935546875, -0.06948089599609375, -0.0657958984375, -0.06211090087890625, -0.0584259033203125, -0.05474090576171875, -0.051055908203125, -0.04737091064453125, -0.0436859130859375, -0.04000091552734375, -0.03631591796875, -0.03263092041015625, -0.0289459228515625, -0.02526092529296875, -0.021575927734375, -0.01789093017578125, -0.0142059326171875, -0.01052093505859375, -0.0068359375, -0.00315093994140625, 0.0005340576171875, 0.00421905517578125, 0.007904052734375, 0.01158905029296875, 0.0152740478515625, 0.01895904541015625, 0.02264404296875, 0.02632904052734375, 0.0300140380859375, 0.03369903564453125, 0.037384033203125, 0.04106903076171875, 0.0447540283203125, 0.04843902587890625, 0.0521240234375, 0.05580902099609375, 0.0594940185546875, 0.06317901611328125, 0.066864013671875, 0.07054901123046875, 0.0742340087890625, 0.07791900634765625, 0.08160400390625, 0.08528900146484375, 0.0889739990234375, 0.09265899658203125, 0.096343994140625, 0.10002899169921875, 0.1037139892578125, 0.10739898681640625, 0.111083984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 8.0, 15.0, 15.0, 21.0, 31.0, 42.0, 64.0, 79.0, 114.0, 141.0, 211.0, 288.0, 433.0, 726.0, 1141.0, 1813.0, 3132.0, 5653.0, 11167.0, 26075.0, 83926.0, 615872.0, 215412.0, 46263.0, 17106.0, 7995.0, 4243.0, 2423.0, 1461.0, 898.0, 558.0, 350.0, 235.0, 182.0, 132.0, 82.0, 56.0, 49.0, 32.0, 36.0, 14.0, 13.0, 14.0, 12.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0149993896484375, -0.0145416259765625, -0.0140838623046875, -0.0136260986328125, -0.0131683349609375, -0.0127105712890625, -0.0122528076171875, -0.0117950439453125, -0.0113372802734375, -0.0108795166015625, -0.0104217529296875, -0.0099639892578125, -0.0095062255859375, -0.0090484619140625, -0.0085906982421875, -0.0081329345703125, -0.0076751708984375, -0.0072174072265625, -0.0067596435546875, -0.0063018798828125, -0.0058441162109375, -0.0053863525390625, -0.0049285888671875, -0.0044708251953125, -0.0040130615234375, -0.0035552978515625, -0.0030975341796875, -0.0026397705078125, -0.0021820068359375, -0.0017242431640625, -0.0012664794921875, -0.0008087158203125, -0.0003509521484375, 0.0001068115234375, 0.0005645751953125, 0.0010223388671875, 0.0014801025390625, 0.0019378662109375, 0.0023956298828125, 0.0028533935546875, 0.0033111572265625, 0.0037689208984375, 0.0042266845703125, 0.0046844482421875, 0.0051422119140625, 0.0055999755859375, 0.0060577392578125, 0.0065155029296875, 0.0069732666015625, 0.0074310302734375, 0.0078887939453125, 0.0083465576171875, 0.0088043212890625, 0.0092620849609375, 0.0097198486328125, 0.0101776123046875, 0.0106353759765625, 0.0110931396484375, 0.0115509033203125, 0.0120086669921875, 0.0124664306640625, 0.0129241943359375, 0.0133819580078125, 0.0138397216796875, 0.0142974853515625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 11.0, 11.0, 9.0, 24.0, 18.0, 27.0, 26.0, 60.0, 46.0, 68.0, 89.0, 80.0, 90.0, 86.0, 86.0, 70.0, 56.0, 30.0, 33.0, 22.0, 16.0, 15.0, 7.0, 2.0, 4.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.562999725341797e-06, -2.5015324354171753e-06, -2.4400651454925537e-06, -2.378597855567932e-06, -2.3171305656433105e-06, -2.255663275718689e-06, -2.1941959857940674e-06, -2.132728695869446e-06, -2.0712614059448242e-06, -2.0097941160202026e-06, -1.948326826095581e-06, -1.8868595361709595e-06, -1.8253922462463379e-06, -1.7639249563217163e-06, -1.7024576663970947e-06, -1.6409903764724731e-06, -1.5795230865478516e-06, -1.51805579662323e-06, -1.4565885066986084e-06, -1.3951212167739868e-06, -1.3336539268493652e-06, -1.2721866369247437e-06, -1.210719347000122e-06, -1.1492520570755005e-06, -1.087784767150879e-06, -1.0263174772262573e-06, -9.648501873016357e-07, -9.033828973770142e-07, -8.419156074523926e-07, -7.80448317527771e-07, -7.189810276031494e-07, -6.575137376785278e-07, -5.960464477539062e-07, -5.345791578292847e-07, -4.731118679046631e-07, -4.116445779800415e-07, -3.501772880554199e-07, -2.8870999813079834e-07, -2.2724270820617676e-07, -1.6577541828155518e-07, -1.043081283569336e-07, -4.284083843231201e-08, 1.862645149230957e-08, 8.009374141693115e-08, 1.4156103134155273e-07, 2.0302832126617432e-07, 2.644956111907959e-07, 3.259629011154175e-07, 3.8743019104003906e-07, 4.4889748096466064e-07, 5.103647708892822e-07, 5.718320608139038e-07, 6.332993507385254e-07, 6.94766640663147e-07, 7.562339305877686e-07, 8.177012205123901e-07, 8.791685104370117e-07, 9.406358003616333e-07, 1.0021030902862549e-06, 1.0635703802108765e-06, 1.125037670135498e-06, 1.1865049600601196e-06, 1.2479722499847412e-06, 1.3094395399093628e-06, 1.3709068298339844e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 9.0, 7.0, 17.0, 17.0, 40.0, 56.0, 93.0, 91.0, 167.0, 256.0, 420.0, 626.0, 865.0, 1365.0, 2143.0, 3285.0, 5210.0, 8659.0, 14172.0, 23919.0, 42990.0, 87289.0, 240371.0, 371203.0, 118226.0, 53911.0, 28638.0, 17025.0, 10062.0, 6228.0, 3965.0, 2419.0, 1632.0, 1077.0, 697.0, 473.0, 311.0, 213.0, 141.0, 91.0, 55.0, 36.0, 32.0, 22.0, 12.0, 12.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.009490966796875, -0.009186506271362305, -0.00888204574584961, -0.008577585220336914, -0.008273124694824219, -0.007968664169311523, -0.007664203643798828, -0.007359743118286133, -0.0070552825927734375, -0.006750822067260742, -0.006446361541748047, -0.0061419010162353516, -0.005837440490722656, -0.005532979965209961, -0.005228519439697266, -0.00492405891418457, -0.004619598388671875, -0.00431513786315918, -0.004010677337646484, -0.003706216812133789, -0.0034017562866210938, -0.0030972957611083984, -0.002792835235595703, -0.002488374710083008, -0.0021839141845703125, -0.0018794536590576172, -0.0015749931335449219, -0.0012705326080322266, -0.0009660720825195312, -0.0006616115570068359, -0.0003571510314941406, -5.269050598144531e-05, 0.00025177001953125, 0.0005562305450439453, 0.0008606910705566406, 0.001165151596069336, 0.0014696121215820312, 0.0017740726470947266, 0.002078533172607422, 0.002382993698120117, 0.0026874542236328125, 0.002991914749145508, 0.003296375274658203, 0.0036008358001708984, 0.0039052963256835938, 0.004209756851196289, 0.004514217376708984, 0.00481867790222168, 0.005123138427734375, 0.00542759895324707, 0.005732059478759766, 0.006036520004272461, 0.006340980529785156, 0.0066454410552978516, 0.006949901580810547, 0.007254362106323242, 0.0075588226318359375, 0.007863283157348633, 0.008167743682861328, 0.008472204208374023, 0.008776664733886719, 0.009081125259399414, 0.00938558578491211, 0.009690046310424805, 0.0099945068359375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 7.0, 4.0, 6.0, 2.0, 5.0, 6.0, 8.0, 5.0, 5.0, 12.0, 19.0, 21.0, 32.0, 51.0, 64.0, 85.0, 93.0, 115.0, 126.0, 77.0, 63.0, 41.0, 29.0, 27.0, 20.0, 11.0, 12.0, 8.0, 7.0, 2.0, 4.0, 11.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.003910064697265625, -0.0037894845008850098, -0.0036689043045043945, -0.0035483241081237793, -0.003427743911743164, -0.003307163715362549, -0.0031865835189819336, -0.0030660033226013184, -0.002945423126220703, -0.002824842929840088, -0.0027042627334594727, -0.0025836825370788574, -0.002463102340698242, -0.002342522144317627, -0.0022219419479370117, -0.0021013617515563965, -0.0019807815551757812, -0.001860201358795166, -0.0017396211624145508, -0.0016190409660339355, -0.0014984607696533203, -0.001377880573272705, -0.0012573003768920898, -0.0011367201805114746, -0.0010161399841308594, -0.0008955597877502441, -0.0007749795913696289, -0.0006543993949890137, -0.0005338191986083984, -0.0004132390022277832, -0.00029265880584716797, -0.00017207860946655273, -5.14984130859375e-05, 6.908178329467773e-05, 0.00018966197967529297, 0.0003102421760559082, 0.00043082237243652344, 0.0005514025688171387, 0.0006719827651977539, 0.0007925629615783691, 0.0009131431579589844, 0.0010337233543395996, 0.0011543035507202148, 0.00127488374710083, 0.0013954639434814453, 0.0015160441398620605, 0.0016366243362426758, 0.001757204532623291, 0.0018777847290039062, 0.0019983649253845215, 0.0021189451217651367, 0.002239525318145752, 0.002360105514526367, 0.0024806857109069824, 0.0026012659072875977, 0.002721846103668213, 0.002842426300048828, 0.0029630064964294434, 0.0030835866928100586, 0.003204166889190674, 0.003324747085571289, 0.0034453272819519043, 0.0035659074783325195, 0.0036864876747131348, 0.00380706787109375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 8.0, 3.0, 6.0, 10.0, 8.0, 10.0, 24.0, 20.0, 30.0, 35.0, 36.0, 54.0, 61.0, 89.0, 104.0, 110.0, 73.0, 70.0, 48.0, 43.0, 29.0, 24.0, 28.0, 15.0, 15.0, 11.0, 12.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.248498797416687, -0.24071991443634033, -0.23294103145599365, -0.22516216337680817, -0.2173832803964615, -0.2096043974161148, -0.20182552933692932, -0.19404664635658264, -0.18626776337623596, -0.17848888039588928, -0.1707099974155426, -0.16293112933635712, -0.15515224635601044, -0.14737336337566376, -0.13959449529647827, -0.1318156123161316, -0.12403672933578491, -0.11625784635543823, -0.10847897082567215, -0.10070009529590607, -0.09292121231555939, -0.08514232933521271, -0.07736345380544662, -0.06958457827568054, -0.06180569529533386, -0.05402681604027748, -0.0462479367852211, -0.03846905753016472, -0.030690178275108337, -0.022911299020051956, -0.015132419764995575, -0.007353540509939194, 0.00042532384395599365, 0.008204203099012375, 0.015983082354068756, 0.023761961609125137, 0.03154084086418152, 0.0393197201192379, 0.04709859937429428, 0.05487747862935066, 0.06265635788440704, 0.07043524086475372, 0.0782141163945198, 0.08599299192428589, 0.09377187490463257, 0.10155075788497925, 0.10932963341474533, 0.11710850894451141, 0.1248873919248581, 0.13266627490520477, 0.14044514298439026, 0.14822402596473694, 0.15600290894508362, 0.1637817919254303, 0.17156067490577698, 0.17933954298496246, 0.18711842596530914, 0.19489730894565582, 0.2026761770248413, 0.210455060005188, 0.21823394298553467, 0.22601282596588135, 0.23379170894622803, 0.2415705770254135, 0.2493494600057602]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 5.0, 9.0, 9.0, 10.0, 13.0, 14.0, 22.0, 29.0, 25.0, 32.0, 32.0, 25.0, 32.0, 35.0, 30.0, 44.0, 33.0, 41.0, 45.0, 39.0, 46.0, 41.0, 27.0, 40.0, 36.0, 36.0, 27.0, 24.0, 27.0, 19.0, 28.0, 15.0, 20.0, 12.0, 17.0, 20.0, 9.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.19703274965286255, -0.1913994550704956, -0.18576616048812866, -0.18013286590576172, -0.17449957132339478, -0.16886627674102783, -0.1632329821586609, -0.15759967267513275, -0.1519663780927658, -0.14633308351039886, -0.14069978892803192, -0.13506649434566498, -0.12943319976329803, -0.1237998977303505, -0.11816660314798355, -0.11253330111503601, -0.10690001398324966, -0.10126671940088272, -0.09563342481851578, -0.09000012278556824, -0.0843668282032013, -0.07873353362083435, -0.07310023903846741, -0.06746694445610046, -0.06183364614844322, -0.05620035156607628, -0.05056705325841904, -0.044933758676052094, -0.03930046409368515, -0.03366716578602791, -0.028033871203660965, -0.022400572896003723, -0.01676727831363678, -0.011133981868624687, -0.005500686354935169, 0.00013260915875434875, 0.005765905603766441, 0.011399202048778534, 0.017032496631145477, 0.02266579493880272, 0.028299089521169662, 0.033932384103536606, 0.03956568241119385, 0.04519897699356079, 0.050832271575927734, 0.056465569883584976, 0.06209886446595192, 0.06773216277360916, 0.0733654573559761, 0.07899875193834305, 0.08463204652070999, 0.09026534855365753, 0.09589864313602448, 0.10153193771839142, 0.10716523230075836, 0.1127985268831253, 0.11843182146549225, 0.12406511604785919, 0.12969841063022614, 0.13533170521259308, 0.14096499979496002, 0.14659830927848816, 0.1522316038608551, 0.15786489844322205, 0.163498193025589]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 12.0, 19.0, 28.0, 40.0, 63.0, 84.0, 152.0, 198.0, 293.0, 460.0, 705.0, 1003.0, 1627.0, 2549.0, 3868.0, 5957.0, 9236.0, 14340.0, 22870.0, 37900.0, 65743.0, 120298.0, 236404.0, 237257.0, 120247.0, 65551.0, 37910.0, 23146.0, 14497.0, 9018.0, 5889.0, 3844.0, 2494.0, 1699.0, 1103.0, 706.0, 428.0, 301.0, 204.0, 138.0, 96.0, 52.0, 41.0, 25.0, 22.0, 7.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.331787109375, -0.32141876220703125, -0.3110504150390625, -0.30068206787109375, -0.290313720703125, -0.27994537353515625, -0.2695770263671875, -0.25920867919921875, -0.24884033203125, -0.23847198486328125, -0.2281036376953125, -0.21773529052734375, -0.207366943359375, -0.19699859619140625, -0.1866302490234375, -0.17626190185546875, -0.1658935546875, -0.15552520751953125, -0.1451568603515625, -0.13478851318359375, -0.124420166015625, -0.11405181884765625, -0.1036834716796875, -0.09331512451171875, -0.08294677734375, -0.07257843017578125, -0.0622100830078125, -0.05184173583984375, -0.041473388671875, -0.03110504150390625, -0.0207366943359375, -0.01036834716796875, 0.0, 0.01036834716796875, 0.0207366943359375, 0.03110504150390625, 0.041473388671875, 0.05184173583984375, 0.0622100830078125, 0.07257843017578125, 0.08294677734375, 0.09331512451171875, 0.1036834716796875, 0.11405181884765625, 0.124420166015625, 0.13478851318359375, 0.1451568603515625, 0.15552520751953125, 0.1658935546875, 0.17626190185546875, 0.1866302490234375, 0.19699859619140625, 0.207366943359375, 0.21773529052734375, 0.2281036376953125, 0.23847198486328125, 0.24884033203125, 0.25920867919921875, 0.2695770263671875, 0.27994537353515625, 0.290313720703125, 0.30068206787109375, 0.3110504150390625, 0.32141876220703125, 0.331787109375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 13.0, 7.0, 9.0, 9.0, 16.0, 16.0, 19.0, 19.0, 34.0, 27.0, 21.0, 32.0, 26.0, 33.0, 42.0, 37.0, 46.0, 31.0, 35.0, 49.0, 54.0, 38.0, 29.0, 35.0, 39.0, 32.0, 36.0, 21.0, 24.0, 24.0, 29.0, 14.0, 14.0, 15.0, 20.0, 9.0, 14.0, 9.0, 8.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.185546875, -0.18055343627929688, -0.17555999755859375, -0.17056655883789062, -0.1655731201171875, -0.16057968139648438, -0.15558624267578125, -0.15059280395507812, -0.145599365234375, -0.14060592651367188, -0.13561248779296875, -0.13061904907226562, -0.1256256103515625, -0.12063217163085938, -0.11563873291015625, -0.11064529418945312, -0.10565185546875, -0.10065841674804688, -0.09566497802734375, -0.09067153930664062, -0.0856781005859375, -0.08068466186523438, -0.07569122314453125, -0.07069778442382812, -0.065704345703125, -0.060710906982421875, -0.05571746826171875, -0.050724029541015625, -0.0457305908203125, -0.040737152099609375, -0.03574371337890625, -0.030750274658203125, -0.0257568359375, -0.020763397216796875, -0.01576995849609375, -0.010776519775390625, -0.0057830810546875, -0.000789642333984375, 0.00420379638671875, 0.009197235107421875, 0.014190673828125, 0.019184112548828125, 0.02417755126953125, 0.029170989990234375, 0.0341644287109375, 0.039157867431640625, 0.04415130615234375, 0.049144744873046875, 0.05413818359375, 0.059131622314453125, 0.06412506103515625, 0.06911849975585938, 0.0741119384765625, 0.07910537719726562, 0.08409881591796875, 0.08909225463867188, 0.094085693359375, 0.09907913208007812, 0.10407257080078125, 0.10906600952148438, 0.1140594482421875, 0.11905288696289062, 0.12404632568359375, 0.12903976440429688, 0.134033203125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 4.0, 13.0, 7.0, 14.0, 18.0, 19.0, 43.0, 47.0, 84.0, 150.0, 197.0, 309.0, 407.0, 683.0, 1007.0, 1521.0, 2342.0, 3719.0, 5771.0, 9382.0, 15126.0, 26049.0, 45164.0, 82649.0, 162644.0, 297032.0, 181227.0, 91119.0, 49800.0, 27933.0, 16610.0, 9966.0, 6189.0, 3893.0, 2588.0, 1600.0, 1082.0, 740.0, 442.0, 320.0, 224.0, 126.0, 99.0, 64.0, 52.0, 30.0, 20.0, 9.0, 13.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3232421875, -0.3123130798339844, -0.30138397216796875, -0.2904548645019531, -0.2795257568359375, -0.2685966491699219, -0.25766754150390625, -0.24673843383789062, -0.235809326171875, -0.22488021850585938, -0.21395111083984375, -0.20302200317382812, -0.1920928955078125, -0.18116378784179688, -0.17023468017578125, -0.15930557250976562, -0.14837646484375, -0.13744735717773438, -0.12651824951171875, -0.11558914184570312, -0.1046600341796875, -0.09373092651367188, -0.08280181884765625, -0.07187271118164062, -0.060943603515625, -0.050014495849609375, -0.03908538818359375, -0.028156280517578125, -0.0172271728515625, -0.006298065185546875, 0.00463104248046875, 0.015560150146484375, 0.0264892578125, 0.037418365478515625, 0.04834747314453125, 0.059276580810546875, 0.0702056884765625, 0.08113479614257812, 0.09206390380859375, 0.10299301147460938, 0.113922119140625, 0.12485122680664062, 0.13578033447265625, 0.14670944213867188, 0.1576385498046875, 0.16856765747070312, 0.17949676513671875, 0.19042587280273438, 0.20135498046875, 0.21228408813476562, 0.22321319580078125, 0.23414230346679688, 0.2450714111328125, 0.2560005187988281, 0.26692962646484375, 0.2778587341308594, 0.288787841796875, 0.2997169494628906, 0.31064605712890625, 0.3215751647949219, 0.3325042724609375, 0.3434333801269531, 0.35436248779296875, 0.3652915954589844, 0.376220703125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 8.0, 9.0, 10.0, 8.0, 14.0, 22.0, 27.0, 21.0, 31.0, 28.0, 29.0, 43.0, 48.0, 34.0, 37.0, 39.0, 47.0, 42.0, 42.0, 44.0, 39.0, 44.0, 46.0, 33.0, 24.0, 28.0, 29.0, 28.0, 16.0, 20.0, 13.0, 23.0, 12.0, 13.0, 12.0, 8.0, 8.0, 2.0, 3.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10321044921875, -0.0999135971069336, -0.09661674499511719, -0.09331989288330078, -0.09002304077148438, -0.08672618865966797, -0.08342933654785156, -0.08013248443603516, -0.07683563232421875, -0.07353878021240234, -0.07024192810058594, -0.06694507598876953, -0.06364822387695312, -0.06035137176513672, -0.05705451965332031, -0.053757667541503906, -0.0504608154296875, -0.047163963317871094, -0.04386711120605469, -0.04057025909423828, -0.037273406982421875, -0.03397655487060547, -0.030679702758789062, -0.027382850646972656, -0.02408599853515625, -0.020789146423339844, -0.017492294311523438, -0.014195442199707031, -0.010898590087890625, -0.007601737976074219, -0.0043048858642578125, -0.0010080337524414062, 0.002288818359375, 0.005585670471191406, 0.008882522583007812, 0.012179374694824219, 0.015476226806640625, 0.01877307891845703, 0.022069931030273438, 0.025366783142089844, 0.02866363525390625, 0.031960487365722656, 0.03525733947753906, 0.03855419158935547, 0.041851043701171875, 0.04514789581298828, 0.04844474792480469, 0.051741600036621094, 0.0550384521484375, 0.058335304260253906, 0.06163215637207031, 0.06492900848388672, 0.06822586059570312, 0.07152271270751953, 0.07481956481933594, 0.07811641693115234, 0.08141326904296875, 0.08471012115478516, 0.08800697326660156, 0.09130382537841797, 0.09460067749023438, 0.09789752960205078, 0.10119438171386719, 0.1044912338256836, 0.1077880859375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 12.0, 17.0, 21.0, 34.0, 42.0, 58.0, 80.0, 83.0, 100.0, 147.0, 175.0, 260.0, 348.0, 430.0, 529.0, 665.0, 799.0, 1066.0, 1406.0, 1941.0, 2965.0, 5342.0, 17313.0, 891295.0, 98434.0, 10665.0, 4233.0, 2554.0, 1781.0, 1305.0, 995.0, 776.0, 607.0, 467.0, 327.0, 272.0, 238.0, 186.0, 140.0, 119.0, 83.0, 63.0, 50.0, 27.0, 32.0, 16.0, 13.0, 12.0, 14.0, 4.0, 5.0, 1.0, 2.0, 3.0], "bins": [-0.1318359375, -0.12793922424316406, -0.12404251098632812, -0.12014579772949219, -0.11624908447265625, -0.11235237121582031, -0.10845565795898438, -0.10455894470214844, -0.1006622314453125, -0.09676551818847656, -0.09286880493164062, -0.08897209167480469, -0.08507537841796875, -0.08117866516113281, -0.07728195190429688, -0.07338523864746094, -0.069488525390625, -0.06559181213378906, -0.061695098876953125, -0.05779838562011719, -0.05390167236328125, -0.05000495910644531, -0.046108245849609375, -0.04221153259277344, -0.0383148193359375, -0.03441810607910156, -0.030521392822265625, -0.026624679565429688, -0.02272796630859375, -0.018831253051757812, -0.014934539794921875, -0.011037826538085938, -0.00714111328125, -0.0032444000244140625, 0.000652313232421875, 0.0045490264892578125, 0.00844573974609375, 0.012342453002929688, 0.016239166259765625, 0.020135879516601562, 0.0240325927734375, 0.027929306030273438, 0.031826019287109375, 0.03572273254394531, 0.03961944580078125, 0.04351615905761719, 0.047412872314453125, 0.05130958557128906, 0.055206298828125, 0.05910301208496094, 0.06299972534179688, 0.06689643859863281, 0.07079315185546875, 0.07468986511230469, 0.07858657836914062, 0.08248329162597656, 0.0863800048828125, 0.09027671813964844, 0.09417343139648438, 0.09807014465332031, 0.10196685791015625, 0.10586357116699219, 0.10976028442382812, 0.11365699768066406, 0.1175537109375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 8.0, 16.0, 10.0, 44.0, 110.0, 220.0, 120.0, 227.0, 114.0, 58.0, 15.0, 14.0, 6.0, 7.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6954879760742188e-06, -3.591179847717285e-06, -3.4868717193603516e-06, -3.382563591003418e-06, -3.2782554626464844e-06, -3.1739473342895508e-06, -3.069639205932617e-06, -2.9653310775756836e-06, -2.86102294921875e-06, -2.7567148208618164e-06, -2.652406692504883e-06, -2.5480985641479492e-06, -2.4437904357910156e-06, -2.339482307434082e-06, -2.2351741790771484e-06, -2.130866050720215e-06, -2.0265579223632812e-06, -1.9222497940063477e-06, -1.817941665649414e-06, -1.7136335372924805e-06, -1.6093254089355469e-06, -1.5050172805786133e-06, -1.4007091522216797e-06, -1.296401023864746e-06, -1.1920928955078125e-06, -1.087784767150879e-06, -9.834766387939453e-07, -8.791685104370117e-07, -7.748603820800781e-07, -6.705522537231445e-07, -5.662441253662109e-07, -4.6193599700927734e-07, -3.5762786865234375e-07, -2.5331974029541016e-07, -1.4901161193847656e-07, -4.470348358154297e-08, 5.960464477539063e-08, 1.6391277313232422e-07, 2.682209014892578e-07, 3.725290298461914e-07, 4.76837158203125e-07, 5.811452865600586e-07, 6.854534149169922e-07, 7.897615432739258e-07, 8.940696716308594e-07, 9.98377799987793e-07, 1.1026859283447266e-06, 1.2069940567016602e-06, 1.3113021850585938e-06, 1.4156103134155273e-06, 1.519918441772461e-06, 1.6242265701293945e-06, 1.7285346984863281e-06, 1.8328428268432617e-06, 1.9371509552001953e-06, 2.041459083557129e-06, 2.1457672119140625e-06, 2.250075340270996e-06, 2.3543834686279297e-06, 2.4586915969848633e-06, 2.562999725341797e-06, 2.6673078536987305e-06, 2.771615982055664e-06, 2.8759241104125977e-06, 2.9802322387695312e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 9.0, 7.0, 8.0, 17.0, 30.0, 26.0, 44.0, 56.0, 87.0, 124.0, 154.0, 220.0, 314.0, 432.0, 659.0, 854.0, 1291.0, 1804.0, 2769.0, 4624.0, 14895.0, 867493.0, 130926.0, 9654.0, 3981.0, 2488.0, 1620.0, 1166.0, 804.0, 573.0, 389.0, 266.0, 222.0, 167.0, 109.0, 72.0, 43.0, 46.0, 35.0, 23.0, 11.0, 16.0, 5.0, 9.0, 5.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.1552734375, -0.15094470977783203, -0.14661598205566406, -0.1422872543334961, -0.13795852661132812, -0.13362979888916016, -0.1293010711669922, -0.12497234344482422, -0.12064361572265625, -0.11631488800048828, -0.11198616027832031, -0.10765743255615234, -0.10332870483398438, -0.0989999771118164, -0.09467124938964844, -0.09034252166748047, -0.0860137939453125, -0.08168506622314453, -0.07735633850097656, -0.0730276107788086, -0.06869888305664062, -0.06437015533447266, -0.06004142761230469, -0.05571269989013672, -0.05138397216796875, -0.04705524444580078, -0.04272651672363281, -0.038397789001464844, -0.034069061279296875, -0.029740333557128906, -0.025411605834960938, -0.02108287811279297, -0.016754150390625, -0.012425422668457031, -0.008096694946289062, -0.0037679672241210938, 0.000560760498046875, 0.004889488220214844, 0.009218215942382812, 0.013546943664550781, 0.01787567138671875, 0.02220439910888672, 0.026533126831054688, 0.030861854553222656, 0.035190582275390625, 0.039519309997558594, 0.04384803771972656, 0.04817676544189453, 0.0525054931640625, 0.05683422088623047, 0.06116294860839844, 0.0654916763305664, 0.06982040405273438, 0.07414913177490234, 0.07847785949707031, 0.08280658721923828, 0.08713531494140625, 0.09146404266357422, 0.09579277038574219, 0.10012149810791016, 0.10445022583007812, 0.1087789535522461, 0.11310768127441406, 0.11743640899658203, 0.12176513671875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 6.0, 24.0, 56.0, 193.0, 595.0, 72.0, 21.0, 7.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034515380859375, -0.03328895568847656, -0.032062530517578125, -0.030836105346679688, -0.02960968017578125, -0.028383255004882812, -0.027156829833984375, -0.025930404663085938, -0.0247039794921875, -0.023477554321289062, -0.022251129150390625, -0.021024703979492188, -0.01979827880859375, -0.018571853637695312, -0.017345428466796875, -0.016119003295898438, -0.014892578125, -0.013666152954101562, -0.012439727783203125, -0.011213302612304688, -0.00998687744140625, -0.008760452270507812, -0.007534027099609375, -0.0063076019287109375, -0.0050811767578125, -0.0038547515869140625, -0.002628326416015625, -0.0014019012451171875, -0.00017547607421875, 0.0010509490966796875, 0.002277374267578125, 0.0035037994384765625, 0.004730224609375, 0.0059566497802734375, 0.007183074951171875, 0.008409500122070312, 0.00963592529296875, 0.010862350463867188, 0.012088775634765625, 0.013315200805664062, 0.0145416259765625, 0.015768051147460938, 0.016994476318359375, 0.018220901489257812, 0.01944732666015625, 0.020673751831054688, 0.021900177001953125, 0.023126602172851562, 0.02435302734375, 0.025579452514648438, 0.026805877685546875, 0.028032302856445312, 0.02925872802734375, 0.030485153198242188, 0.031711578369140625, 0.03293800354003906, 0.0341644287109375, 0.03539085388183594, 0.036617279052734375, 0.03784370422363281, 0.03907012939453125, 0.04029655456542969, 0.041522979736328125, 0.04274940490722656, 0.043975830078125]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 10.0, 8.0, 13.0, 14.0, 19.0, 18.0, 21.0, 35.0, 53.0, 69.0, 80.0, 114.0, 110.0, 111.0, 68.0, 47.0, 54.0, 36.0, 25.0, 15.0, 18.0, 20.0, 8.0, 8.0, 8.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.30425775051116943, -0.2961089015007019, -0.28796008229255676, -0.27981123328208923, -0.2716623842716217, -0.26351356506347656, -0.25536471605300903, -0.2472158670425415, -0.23906703293323517, -0.23091819882392883, -0.2227693498134613, -0.21462051570415497, -0.20647168159484863, -0.1983228325843811, -0.19017399847507477, -0.18202516436576843, -0.1738763153553009, -0.16572748124599457, -0.15757863223552704, -0.1494297981262207, -0.14128094911575317, -0.13313211500644684, -0.1249832808971405, -0.11683443933725357, -0.10868559777736664, -0.1005367562174797, -0.09238791465759277, -0.08423908054828644, -0.0760902389883995, -0.06794139742851257, -0.05979255959391594, -0.051643721759319305, -0.04349489510059357, -0.035346053540706635, -0.02719721570611, -0.019048376008868217, -0.010899536311626434, -0.002750694751739502, 0.005398143082857132, 0.013546980917453766, 0.021695822477340698, 0.02984466217458248, 0.037993501871824265, 0.0461423397064209, 0.05429118126630783, 0.06244002282619476, 0.0705888569355011, 0.07873769849538803, 0.08688654005527496, 0.0950353816151619, 0.10318422317504883, 0.11133305728435516, 0.1194818988442421, 0.12763074040412903, 0.13577957451343536, 0.1439284086227417, 0.15207725763320923, 0.16022609174251556, 0.1683749407529831, 0.17652377486228943, 0.18467262387275696, 0.1928214579820633, 0.20097029209136963, 0.20911914110183716, 0.2172679752111435]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 9.0, 8.0, 13.0, 11.0, 13.0, 18.0, 17.0, 24.0, 23.0, 27.0, 30.0, 27.0, 35.0, 28.0, 35.0, 40.0, 26.0, 35.0, 42.0, 34.0, 43.0, 38.0, 32.0, 38.0, 43.0, 35.0, 23.0, 25.0, 32.0, 19.0, 31.0, 19.0, 20.0, 15.0, 21.0, 9.0, 8.0, 11.0, 5.0, 9.0, 9.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.17656075954437256, -0.1715831458568573, -0.16660553216934204, -0.1616279035806656, -0.15665028989315033, -0.15167267620563507, -0.1466950625181198, -0.14171744883060455, -0.1367398202419281, -0.13176220655441284, -0.12678459286689758, -0.12180697172880173, -0.11682935059070587, -0.11185173690319061, -0.10687412321567535, -0.1018965095281601, -0.09691889584064484, -0.09194128215312958, -0.08696366101503372, -0.08198604732751846, -0.07700842618942261, -0.07203081250190735, -0.06705319881439209, -0.06207558140158653, -0.057097963988780975, -0.05212034657597542, -0.04714272916316986, -0.0421651154756546, -0.037187498062849045, -0.03220988065004349, -0.02723226509988308, -0.02225464954972267, -0.01727701723575592, -0.012299400754272938, -0.007321784272789955, -0.0023441677913069725, 0.00263344869017601, 0.007611066102981567, 0.012588681653141975, 0.017566297203302383, 0.02254391461610794, 0.027521532028913498, 0.032499149441719055, 0.037476763129234314, 0.04245438054203987, 0.04743199795484543, 0.05240961164236069, 0.057387229055166245, 0.0623648464679718, 0.06734246015548706, 0.07232008129358292, 0.07729769498109818, 0.08227531611919403, 0.08725292980670929, 0.09223054349422455, 0.09720815718173981, 0.10218577831983566, 0.10716339200735092, 0.11214101314544678, 0.11711862683296204, 0.1220962405204773, 0.12707385420799255, 0.132051482796669, 0.13702909648418427, 0.14200671017169952]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 12.0, 14.0, 21.0, 24.0, 54.0, 62.0, 108.0, 147.0, 222.0, 355.0, 572.0, 929.0, 1429.0, 2388.0, 3818.0, 6490.0, 10669.0, 18535.0, 32967.0, 62860.0, 128053.0, 318160.0, 1405482.0, 1565846.0, 351229.0, 136422.0, 66232.0, 34787.0, 19097.0, 11052.0, 6422.0, 3843.0, 2246.0, 1453.0, 855.0, 544.0, 323.0, 220.0, 130.0, 81.0, 46.0, 21.0, 16.0, 13.0, 12.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.287841796875, -0.2793846130371094, -0.27092742919921875, -0.2624702453613281, -0.2540130615234375, -0.24555587768554688, -0.23709869384765625, -0.22864151000976562, -0.220184326171875, -0.21172714233398438, -0.20326995849609375, -0.19481277465820312, -0.1863555908203125, -0.17789840698242188, -0.16944122314453125, -0.16098403930664062, -0.15252685546875, -0.14406967163085938, -0.13561248779296875, -0.12715530395507812, -0.1186981201171875, -0.11024093627929688, -0.10178375244140625, -0.09332656860351562, -0.084869384765625, -0.07641220092773438, -0.06795501708984375, -0.059497833251953125, -0.0510406494140625, -0.042583465576171875, -0.03412628173828125, -0.025669097900390625, -0.0172119140625, -0.008754730224609375, -0.00029754638671875, 0.008159637451171875, 0.0166168212890625, 0.025074005126953125, 0.03353118896484375, 0.041988372802734375, 0.050445556640625, 0.058902740478515625, 0.06735992431640625, 0.07581710815429688, 0.0842742919921875, 0.09273147583007812, 0.10118865966796875, 0.10964584350585938, 0.11810302734375, 0.12656021118164062, 0.13501739501953125, 0.14347457885742188, 0.1519317626953125, 0.16038894653320312, 0.16884613037109375, 0.17730331420898438, 0.185760498046875, 0.19421768188476562, 0.20267486572265625, 0.21113204956054688, 0.2195892333984375, 0.22804641723632812, 0.23650360107421875, 0.24496078491210938, 0.25341796875]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 1.0, 8.0, 4.0, 7.0, 4.0, 12.0, 15.0, 14.0, 9.0, 17.0, 15.0, 28.0, 25.0, 33.0, 35.0, 31.0, 28.0, 26.0, 29.0, 36.0, 35.0, 38.0, 50.0, 36.0, 33.0, 31.0, 37.0, 40.0, 43.0, 34.0, 24.0, 22.0, 26.0, 22.0, 35.0, 15.0, 13.0, 11.0, 12.0, 7.0, 13.0, 5.0, 13.0, 6.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 5.0], "bins": [-0.1044921875, -0.10157012939453125, -0.0986480712890625, -0.09572601318359375, -0.092803955078125, -0.08988189697265625, -0.0869598388671875, -0.08403778076171875, -0.08111572265625, -0.07819366455078125, -0.0752716064453125, -0.07234954833984375, -0.069427490234375, -0.06650543212890625, -0.0635833740234375, -0.06066131591796875, -0.0577392578125, -0.05481719970703125, -0.0518951416015625, -0.04897308349609375, -0.046051025390625, -0.04312896728515625, -0.0402069091796875, -0.03728485107421875, -0.03436279296875, -0.03144073486328125, -0.0285186767578125, -0.02559661865234375, -0.022674560546875, -0.01975250244140625, -0.0168304443359375, -0.01390838623046875, -0.010986328125, -0.00806427001953125, -0.0051422119140625, -0.00222015380859375, 0.000701904296875, 0.00362396240234375, 0.0065460205078125, 0.00946807861328125, 0.01239013671875, 0.01531219482421875, 0.0182342529296875, 0.02115631103515625, 0.024078369140625, 0.02700042724609375, 0.0299224853515625, 0.03284454345703125, 0.0357666015625, 0.03868865966796875, 0.0416107177734375, 0.04453277587890625, 0.047454833984375, 0.05037689208984375, 0.0532989501953125, 0.05622100830078125, 0.05914306640625, 0.06206512451171875, 0.0649871826171875, 0.06790924072265625, 0.070831298828125, 0.07375335693359375, 0.0766754150390625, 0.07959747314453125, 0.08251953125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 0.0, 4.0, 5.0, 11.0, 18.0, 28.0, 27.0, 46.0, 66.0, 96.0, 146.0, 211.0, 375.0, 532.0, 825.0, 1326.0, 2138.0, 3395.0, 5723.0, 9488.0, 16058.0, 27773.0, 49998.0, 91495.0, 178598.0, 384664.0, 1050440.0, 1413018.0, 491503.0, 218435.0, 109816.0, 58653.0, 32255.0, 18777.0, 11023.0, 6609.0, 4024.0, 2470.0, 1523.0, 996.0, 645.0, 370.0, 222.0, 154.0, 102.0, 74.0, 40.0, 39.0, 17.0, 13.0, 9.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1766357421875, -0.17096328735351562, -0.16529083251953125, -0.15961837768554688, -0.1539459228515625, -0.14827346801757812, -0.14260101318359375, -0.13692855834960938, -0.131256103515625, -0.12558364868164062, -0.11991119384765625, -0.11423873901367188, -0.1085662841796875, -0.10289382934570312, -0.09722137451171875, -0.09154891967773438, -0.08587646484375, -0.08020401000976562, -0.07453155517578125, -0.06885910034179688, -0.0631866455078125, -0.057514190673828125, -0.05184173583984375, -0.046169281005859375, -0.040496826171875, -0.034824371337890625, -0.02915191650390625, -0.023479461669921875, -0.0178070068359375, -0.012134552001953125, -0.00646209716796875, -0.000789642333984375, 0.0048828125, 0.010555267333984375, 0.01622772216796875, 0.021900177001953125, 0.0275726318359375, 0.033245086669921875, 0.03891754150390625, 0.044589996337890625, 0.050262451171875, 0.055934906005859375, 0.06160736083984375, 0.06727981567382812, 0.0729522705078125, 0.07862472534179688, 0.08429718017578125, 0.08996963500976562, 0.09564208984375, 0.10131454467773438, 0.10698699951171875, 0.11265945434570312, 0.1183319091796875, 0.12400436401367188, 0.12967681884765625, 0.13534927368164062, 0.141021728515625, 0.14669418334960938, 0.15236663818359375, 0.15803909301757812, 0.1637115478515625, 0.16938400268554688, 0.17505645751953125, 0.18072891235351562, 0.1864013671875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 11.0, 16.0, 18.0, 22.0, 27.0, 37.0, 36.0, 61.0, 78.0, 79.0, 82.0, 114.0, 136.0, 141.0, 180.0, 198.0, 272.0, 266.0, 287.0, 313.0, 273.0, 239.0, 188.0, 164.0, 146.0, 132.0, 97.0, 75.0, 98.0, 58.0, 38.0, 42.0, 47.0, 18.0, 12.0, 24.0, 9.0, 14.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.051849365234375, -0.050127506256103516, -0.04840564727783203, -0.04668378829956055, -0.04496192932128906, -0.04324007034301758, -0.041518211364746094, -0.03979635238647461, -0.038074493408203125, -0.03635263442993164, -0.034630775451660156, -0.03290891647338867, -0.031187057495117188, -0.029465198516845703, -0.02774333953857422, -0.026021480560302734, -0.02429962158203125, -0.022577762603759766, -0.02085590362548828, -0.019134044647216797, -0.017412185668945312, -0.015690326690673828, -0.013968467712402344, -0.01224660873413086, -0.010524749755859375, -0.00880289077758789, -0.007081031799316406, -0.005359172821044922, -0.0036373138427734375, -0.0019154548645019531, -0.00019359588623046875, 0.0015282630920410156, 0.0032501220703125, 0.004971981048583984, 0.006693840026855469, 0.008415699005126953, 0.010137557983398438, 0.011859416961669922, 0.013581275939941406, 0.01530313491821289, 0.017024993896484375, 0.01874685287475586, 0.020468711853027344, 0.022190570831298828, 0.023912429809570312, 0.025634288787841797, 0.02735614776611328, 0.029078006744384766, 0.03079986572265625, 0.032521724700927734, 0.03424358367919922, 0.0359654426574707, 0.03768730163574219, 0.03940916061401367, 0.041131019592285156, 0.04285287857055664, 0.044574737548828125, 0.04629659652709961, 0.048018455505371094, 0.04974031448364258, 0.05146217346191406, 0.05318403244018555, 0.05490589141845703, 0.056627750396728516, 0.058349609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 4.0, 8.0, 10.0, 7.0, 11.0, 15.0, 16.0, 18.0, 31.0, 31.0, 39.0, 48.0, 56.0, 68.0, 86.0, 80.0, 71.0, 68.0, 55.0, 48.0, 32.0, 35.0, 25.0, 22.0, 19.0, 12.0, 14.0, 11.0, 13.0, 9.0, 6.0, 5.0, 3.0, 1.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.14652322232723236, -0.14243143796920776, -0.13833963871002197, -0.13424783945083618, -0.13015605509281158, -0.126064270734787, -0.1219724714756012, -0.117880679666996, -0.11378888785839081, -0.10969709604978561, -0.10560530424118042, -0.10151351243257523, -0.09742172062397003, -0.09332992881536484, -0.08923813700675964, -0.08514634519815445, -0.08105455338954926, -0.07696276158094406, -0.07287096977233887, -0.06877917796373367, -0.06468738615512848, -0.060595594346523285, -0.05650380253791809, -0.0524120107293129, -0.0483202189207077, -0.04422842711210251, -0.040136635303497314, -0.03604484349489212, -0.031953051686286926, -0.027861259877681732, -0.023769468069076538, -0.019677676260471344, -0.015585869550704956, -0.011494077742099762, -0.007402285933494568, -0.0033104941248893738, 0.0007812976837158203, 0.004873089492321014, 0.008964881300926208, 0.013056673109531403, 0.017148464918136597, 0.02124025672674179, 0.025332048535346985, 0.02942384034395218, 0.03351563215255737, 0.03760742396116257, 0.04169921576976776, 0.045791007578372955, 0.04988279938697815, 0.053974591195583344, 0.05806638300418854, 0.06215817481279373, 0.06624996662139893, 0.07034175843000412, 0.07443355023860931, 0.07852534204721451, 0.0826171338558197, 0.0867089256644249, 0.09080071747303009, 0.09489250928163528, 0.09898430109024048, 0.10307609289884567, 0.10716788470745087, 0.11125967651605606, 0.11535146832466125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 9.0, 8.0, 14.0, 14.0, 17.0, 30.0, 28.0, 25.0, 30.0, 33.0, 29.0, 33.0, 33.0, 34.0, 42.0, 38.0, 34.0, 33.0, 40.0, 31.0, 38.0, 36.0, 44.0, 34.0, 34.0, 24.0, 28.0, 23.0, 20.0, 23.0, 22.0, 15.0, 15.0, 10.0, 16.0, 13.0, 6.0, 6.0, 7.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10319755971431732, -0.09983530640602112, -0.09647306054830551, -0.09311080724000931, -0.0897485613822937, -0.0863863080739975, -0.0830240547657013, -0.07966180145740509, -0.07629955559968948, -0.07293730229139328, -0.06957505643367767, -0.06621280312538147, -0.06285054981708527, -0.05948830395936966, -0.056126050651073456, -0.05276380106806755, -0.049401551485061646, -0.04603930190205574, -0.042677052319049835, -0.03931479901075363, -0.035952549427747726, -0.03259029984474182, -0.029228048399090767, -0.025865796953439713, -0.022503547370433807, -0.019141297787427902, -0.015779046341776848, -0.012416795827448368, -0.009054545313119888, -0.005692295730113983, -0.0023300442844629288, 0.0010322071611881256, 0.004394456744194031, 0.0077567072585225105, 0.01111895777285099, 0.01448120828717947, 0.01784345880150795, 0.021205708384513855, 0.02456795983016491, 0.027930211275815964, 0.03129246085882187, 0.034654710441827774, 0.03801696002483368, 0.04137921333312988, 0.04474146291613579, 0.04810371249914169, 0.0514659658074379, 0.0548282153904438, 0.05819046497344971, 0.06155271455645561, 0.06491496413946152, 0.06827721744775772, 0.07163946330547333, 0.07500171661376953, 0.07836396992206573, 0.08172622323036194, 0.08508846908807755, 0.08845072239637375, 0.09181296825408936, 0.09517522156238556, 0.09853747487068176, 0.10189972072839737, 0.10526197403669357, 0.10862421989440918, 0.11198647320270538]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 6.0, 15.0, 13.0, 30.0, 47.0, 63.0, 90.0, 118.0, 211.0, 309.0, 514.0, 748.0, 1154.0, 1678.0, 2585.0, 3876.0, 6093.0, 9526.0, 15449.0, 25904.0, 45872.0, 86927.0, 183131.0, 312016.0, 165574.0, 79312.0, 42478.0, 24448.0, 14575.0, 8981.0, 5805.0, 3797.0, 2500.0, 1582.0, 1037.0, 684.0, 438.0, 318.0, 188.0, 160.0, 94.0, 68.0, 39.0, 37.0, 22.0, 11.0, 13.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0716552734375, -0.06951236724853516, -0.06736946105957031, -0.06522655487060547, -0.06308364868164062, -0.06094074249267578, -0.05879783630371094, -0.056654930114746094, -0.05451202392578125, -0.052369117736816406, -0.05022621154785156, -0.04808330535888672, -0.045940399169921875, -0.04379749298095703, -0.04165458679199219, -0.039511680603027344, -0.0373687744140625, -0.035225868225097656, -0.03308296203613281, -0.03094005584716797, -0.028797149658203125, -0.02665424346923828, -0.024511337280273438, -0.022368431091308594, -0.02022552490234375, -0.018082618713378906, -0.015939712524414062, -0.013796806335449219, -0.011653900146484375, -0.009510993957519531, -0.0073680877685546875, -0.005225181579589844, -0.003082275390625, -0.0009393692016601562, 0.0012035369873046875, 0.0033464431762695312, 0.005489349365234375, 0.007632255554199219, 0.009775161743164062, 0.011918067932128906, 0.01406097412109375, 0.016203880310058594, 0.018346786499023438, 0.02048969268798828, 0.022632598876953125, 0.02477550506591797, 0.026918411254882812, 0.029061317443847656, 0.0312042236328125, 0.033347129821777344, 0.03549003601074219, 0.03763294219970703, 0.039775848388671875, 0.04191875457763672, 0.04406166076660156, 0.046204566955566406, 0.04834747314453125, 0.050490379333496094, 0.05263328552246094, 0.05477619171142578, 0.056919097900390625, 0.05906200408935547, 0.06120491027832031, 0.06334781646728516, 0.06549072265625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 4.0, 3.0, 5.0, 8.0, 10.0, 14.0, 16.0, 17.0, 26.0, 27.0, 32.0, 28.0, 26.0, 31.0, 40.0, 42.0, 30.0, 42.0, 40.0, 46.0, 36.0, 37.0, 34.0, 44.0, 39.0, 46.0, 30.0, 25.0, 24.0, 25.0, 22.0, 21.0, 24.0, 12.0, 20.0, 10.0, 9.0, 12.0, 14.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.110107421875, -0.10659122467041016, -0.10307502746582031, -0.09955883026123047, -0.09604263305664062, -0.09252643585205078, -0.08901023864746094, -0.0854940414428711, -0.08197784423828125, -0.0784616470336914, -0.07494544982910156, -0.07142925262451172, -0.06791305541992188, -0.06439685821533203, -0.06088066101074219, -0.057364463806152344, -0.0538482666015625, -0.050332069396972656, -0.04681587219238281, -0.04329967498779297, -0.039783477783203125, -0.03626728057861328, -0.03275108337402344, -0.029234886169433594, -0.02571868896484375, -0.022202491760253906, -0.018686294555664062, -0.015170097351074219, -0.011653900146484375, -0.008137702941894531, -0.0046215057373046875, -0.0011053085327148438, 0.002410888671875, 0.005927085876464844, 0.009443283081054688, 0.012959480285644531, 0.016475677490234375, 0.01999187469482422, 0.023508071899414062, 0.027024269104003906, 0.03054046630859375, 0.034056663513183594, 0.03757286071777344, 0.04108905792236328, 0.044605255126953125, 0.04812145233154297, 0.05163764953613281, 0.055153846740722656, 0.0586700439453125, 0.062186241149902344, 0.06570243835449219, 0.06921863555908203, 0.07273483276367188, 0.07625102996826172, 0.07976722717285156, 0.0832834243774414, 0.08679962158203125, 0.0903158187866211, 0.09383201599121094, 0.09734821319580078, 0.10086441040039062, 0.10438060760498047, 0.10789680480957031, 0.11141300201416016, 0.11492919921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 10.0, 22.0, 28.0, 41.0, 46.0, 56.0, 78.0, 125.0, 142.0, 251.0, 320.0, 436.0, 639.0, 903.0, 1380.0, 2008.0, 3099.0, 5112.0, 8898.0, 16826.0, 39598.0, 130042.0, 518025.0, 214056.0, 56828.0, 21662.0, 10857.0, 5992.0, 3515.0, 2399.0, 1592.0, 1017.0, 698.0, 524.0, 422.0, 260.0, 173.0, 127.0, 95.0, 70.0, 45.0, 36.0, 31.0, 15.0, 15.0, 14.0, 6.0, 2.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.107666015625, -0.10426616668701172, -0.10086631774902344, -0.09746646881103516, -0.09406661987304688, -0.0906667709350586, -0.08726692199707031, -0.08386707305908203, -0.08046722412109375, -0.07706737518310547, -0.07366752624511719, -0.0702676773071289, -0.06686782836914062, -0.06346797943115234, -0.06006813049316406, -0.05666828155517578, -0.0532684326171875, -0.04986858367919922, -0.04646873474121094, -0.043068885803222656, -0.039669036865234375, -0.036269187927246094, -0.03286933898925781, -0.02946949005126953, -0.02606964111328125, -0.02266979217529297, -0.019269943237304688, -0.015870094299316406, -0.012470245361328125, -0.009070396423339844, -0.0056705474853515625, -0.0022706985473632812, 0.001129150390625, 0.004528999328613281, 0.007928848266601562, 0.011328697204589844, 0.014728546142578125, 0.018128395080566406, 0.021528244018554688, 0.02492809295654297, 0.02832794189453125, 0.03172779083251953, 0.03512763977050781, 0.038527488708496094, 0.041927337646484375, 0.045327186584472656, 0.04872703552246094, 0.05212688446044922, 0.0555267333984375, 0.05892658233642578, 0.06232643127441406, 0.06572628021240234, 0.06912612915039062, 0.0725259780883789, 0.07592582702636719, 0.07932567596435547, 0.08272552490234375, 0.08612537384033203, 0.08952522277832031, 0.0929250717163086, 0.09632492065429688, 0.09972476959228516, 0.10312461853027344, 0.10652446746826172, 0.10992431640625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 9.0, 4.0, 7.0, 10.0, 11.0, 12.0, 21.0, 23.0, 19.0, 34.0, 33.0, 33.0, 31.0, 39.0, 36.0, 40.0, 39.0, 52.0, 42.0, 46.0, 52.0, 33.0, 39.0, 43.0, 37.0, 34.0, 35.0, 27.0, 28.0, 23.0, 18.0, 21.0, 14.0, 7.0, 14.0, 11.0, 7.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07696533203125, -0.07450485229492188, -0.07204437255859375, -0.06958389282226562, -0.0671234130859375, -0.06466293334960938, -0.06220245361328125, -0.059741973876953125, -0.057281494140625, -0.054821014404296875, -0.05236053466796875, -0.049900054931640625, -0.0474395751953125, -0.044979095458984375, -0.04251861572265625, -0.040058135986328125, -0.03759765625, -0.035137176513671875, -0.03267669677734375, -0.030216217041015625, -0.0277557373046875, -0.025295257568359375, -0.02283477783203125, -0.020374298095703125, -0.017913818359375, -0.015453338623046875, -0.01299285888671875, -0.010532379150390625, -0.0080718994140625, -0.005611419677734375, -0.00315093994140625, -0.000690460205078125, 0.00177001953125, 0.004230499267578125, 0.00669097900390625, 0.009151458740234375, 0.0116119384765625, 0.014072418212890625, 0.01653289794921875, 0.018993377685546875, 0.021453857421875, 0.023914337158203125, 0.02637481689453125, 0.028835296630859375, 0.0312957763671875, 0.033756256103515625, 0.03621673583984375, 0.038677215576171875, 0.0411376953125, 0.043598175048828125, 0.04605865478515625, 0.048519134521484375, 0.0509796142578125, 0.053440093994140625, 0.05590057373046875, 0.058361053466796875, 0.060821533203125, 0.06328201293945312, 0.06574249267578125, 0.06820297241210938, 0.0706634521484375, 0.07312393188476562, 0.07558441162109375, 0.07804489135742188, 0.08050537109375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 9.0, 4.0, 14.0, 18.0, 13.0, 17.0, 23.0, 28.0, 36.0, 49.0, 73.0, 110.0, 148.0, 196.0, 323.0, 545.0, 894.0, 1436.0, 2692.0, 5504.0, 13205.0, 41994.0, 318985.0, 579093.0, 54103.0, 15581.0, 6202.0, 3054.0, 1572.0, 871.0, 570.0, 372.0, 222.0, 168.0, 108.0, 83.0, 73.0, 46.0, 35.0, 27.0, 9.0, 19.0, 9.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00958251953125, -0.00925302505493164, -0.008923530578613281, -0.008594036102294922, -0.008264541625976562, -0.007935047149658203, -0.007605552673339844, -0.007276058197021484, -0.006946563720703125, -0.006617069244384766, -0.006287574768066406, -0.005958080291748047, -0.0056285858154296875, -0.005299091339111328, -0.004969596862792969, -0.004640102386474609, -0.00431060791015625, -0.003981113433837891, -0.0036516189575195312, -0.003322124481201172, -0.0029926300048828125, -0.002663135528564453, -0.0023336410522460938, -0.0020041465759277344, -0.001674652099609375, -0.0013451576232910156, -0.0010156631469726562, -0.0006861686706542969, -0.0003566741943359375, -2.7179718017578125e-05, 0.00030231475830078125, 0.0006318092346191406, 0.0009613037109375, 0.0012907981872558594, 0.0016202926635742188, 0.0019497871398925781, 0.0022792816162109375, 0.002608776092529297, 0.0029382705688476562, 0.0032677650451660156, 0.003597259521484375, 0.003926753997802734, 0.004256248474121094, 0.004585742950439453, 0.0049152374267578125, 0.005244731903076172, 0.005574226379394531, 0.005903720855712891, 0.00623321533203125, 0.006562709808349609, 0.006892204284667969, 0.007221698760986328, 0.0075511932373046875, 0.007880687713623047, 0.008210182189941406, 0.008539676666259766, 0.008869171142578125, 0.009198665618896484, 0.009528160095214844, 0.009857654571533203, 0.010187149047851562, 0.010516643524169922, 0.010846138000488281, 0.01117563247680664, 0.011505126953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 7.0, 0.0, 4.0, 6.0, 0.0, 7.0, 16.0, 0.0, 24.0, 0.0, 23.0, 28.0, 0.0, 43.0, 67.0, 0.0, 68.0, 0.0, 86.0, 80.0, 0.0, 93.0, 106.0, 0.0, 86.0, 0.0, 68.0, 49.0, 0.0, 45.0, 23.0, 0.0, 27.0, 0.0, 12.0, 23.0, 0.0, 9.0, 6.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.760260581970215e-07, -9.387731552124023e-07, -9.015202522277832e-07, -8.642673492431641e-07, -8.270144462585449e-07, -7.897615432739258e-07, -7.525086402893066e-07, -7.152557373046875e-07, -6.780028343200684e-07, -6.407499313354492e-07, -6.034970283508301e-07, -5.662441253662109e-07, -5.289912223815918e-07, -4.917383193969727e-07, -4.544854164123535e-07, -4.172325134277344e-07, -3.7997961044311523e-07, -3.427267074584961e-07, -3.0547380447387695e-07, -2.682209014892578e-07, -2.3096799850463867e-07, -1.9371509552001953e-07, -1.564621925354004e-07, -1.1920928955078125e-07, -8.195638656616211e-08, -4.470348358154297e-08, -7.450580596923828e-09, 2.9802322387695312e-08, 6.705522537231445e-08, 1.043081283569336e-07, 1.4156103134155273e-07, 1.7881393432617188e-07, 2.1606683731079102e-07, 2.5331974029541016e-07, 2.905726432800293e-07, 3.2782554626464844e-07, 3.650784492492676e-07, 4.023313522338867e-07, 4.3958425521850586e-07, 4.76837158203125e-07, 5.140900611877441e-07, 5.513429641723633e-07, 5.885958671569824e-07, 6.258487701416016e-07, 6.631016731262207e-07, 7.003545761108398e-07, 7.37607479095459e-07, 7.748603820800781e-07, 8.121132850646973e-07, 8.493661880493164e-07, 8.866190910339355e-07, 9.238719940185547e-07, 9.611248970031738e-07, 9.98377799987793e-07, 1.0356307029724121e-06, 1.0728836059570312e-06, 1.1101365089416504e-06, 1.1473894119262695e-06, 1.1846423149108887e-06, 1.2218952178955078e-06, 1.259148120880127e-06, 1.296401023864746e-06, 1.3336539268493652e-06, 1.3709068298339844e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 9.0, 11.0, 10.0, 17.0, 25.0, 37.0, 35.0, 72.0, 78.0, 130.0, 171.0, 203.0, 336.0, 466.0, 673.0, 1022.0, 1473.0, 2245.0, 3544.0, 6127.0, 11428.0, 24149.0, 64608.0, 268885.0, 497059.0, 98438.0, 32865.0, 14604.0, 7492.0, 4267.0, 2611.0, 1738.0, 1157.0, 745.0, 536.0, 370.0, 240.0, 181.0, 134.0, 97.0, 67.0, 58.0, 45.0, 35.0, 20.0, 17.0, 6.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00916290283203125, -0.00888669490814209, -0.00861048698425293, -0.00833427906036377, -0.00805807113647461, -0.007781863212585449, -0.007505655288696289, -0.007229447364807129, -0.006953239440917969, -0.006677031517028809, -0.0064008235931396484, -0.006124615669250488, -0.005848407745361328, -0.005572199821472168, -0.005295991897583008, -0.005019783973693848, -0.0047435760498046875, -0.004467368125915527, -0.004191160202026367, -0.003914952278137207, -0.003638744354248047, -0.0033625364303588867, -0.0030863285064697266, -0.0028101205825805664, -0.0025339126586914062, -0.002257704734802246, -0.001981496810913086, -0.0017052888870239258, -0.0014290809631347656, -0.0011528730392456055, -0.0008766651153564453, -0.0006004571914672852, -0.000324249267578125, -4.8041343688964844e-05, 0.0002281665802001953, 0.0005043745040893555, 0.0007805824279785156, 0.0010567903518676758, 0.001332998275756836, 0.001609206199645996, 0.0018854141235351562, 0.0021616220474243164, 0.0024378299713134766, 0.0027140378952026367, 0.002990245819091797, 0.003266453742980957, 0.003542661666870117, 0.0038188695907592773, 0.0040950775146484375, 0.004371285438537598, 0.004647493362426758, 0.004923701286315918, 0.005199909210205078, 0.005476117134094238, 0.0057523250579833984, 0.006028532981872559, 0.006304740905761719, 0.006580948829650879, 0.006857156753540039, 0.007133364677429199, 0.007409572601318359, 0.0076857805252075195, 0.00796198844909668, 0.00823819637298584, 0.008514404296875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 6.0, 4.0, 6.0, 3.0, 11.0, 10.0, 27.0, 26.0, 15.0, 24.0, 45.0, 67.0, 68.0, 114.0, 107.0, 112.0, 79.0, 58.0, 49.0, 38.0, 18.0, 17.0, 14.0, 15.0, 11.0, 11.0, 4.0, 6.0, 7.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002429962158203125, -0.0023506879806518555, -0.002271413803100586, -0.0021921396255493164, -0.002112865447998047, -0.0020335912704467773, -0.001954317092895508, -0.0018750429153442383, -0.0017957687377929688, -0.0017164945602416992, -0.0016372203826904297, -0.0015579462051391602, -0.0014786720275878906, -0.001399397850036621, -0.0013201236724853516, -0.001240849494934082, -0.0011615753173828125, -0.001082301139831543, -0.0010030269622802734, -0.0009237527847290039, -0.0008444786071777344, -0.0007652044296264648, -0.0006859302520751953, -0.0006066560745239258, -0.0005273818969726562, -0.0004481077194213867, -0.0003688335418701172, -0.00028955936431884766, -0.00021028518676757812, -0.0001310110092163086, -5.173683166503906e-05, 2.753734588623047e-05, 0.0001068115234375, 0.00018608570098876953, 0.00026535987854003906, 0.0003446340560913086, 0.0004239082336425781, 0.0005031824111938477, 0.0005824565887451172, 0.0006617307662963867, 0.0007410049438476562, 0.0008202791213989258, 0.0008995532989501953, 0.0009788274765014648, 0.0010581016540527344, 0.001137375831604004, 0.0012166500091552734, 0.001295924186706543, 0.0013751983642578125, 0.001454472541809082, 0.0015337467193603516, 0.001613020896911621, 0.0016922950744628906, 0.0017715692520141602, 0.0018508434295654297, 0.0019301176071166992, 0.0020093917846679688, 0.0020886659622192383, 0.002167940139770508, 0.0022472143173217773, 0.002326488494873047, 0.0024057626724243164, 0.002485036849975586, 0.0025643110275268555, 0.002643585205078125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 6.0, 10.0, 3.0, 13.0, 9.0, 23.0, 16.0, 16.0, 30.0, 38.0, 44.0, 44.0, 67.0, 69.0, 86.0, 78.0, 74.0, 59.0, 46.0, 52.0, 27.0, 33.0, 26.0, 20.0, 15.0, 15.0, 16.0, 9.0, 12.0, 6.0, 7.0, 3.0, 3.0, 1.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.14434586465358734, -0.14026324450969696, -0.13618060946464539, -0.132097989320755, -0.12801536917686462, -0.12393274903297424, -0.11985012143850327, -0.11576749384403229, -0.1116848737001419, -0.10760225355625153, -0.10351962596178055, -0.09943699836730957, -0.09535437822341919, -0.09127175807952881, -0.08718913048505783, -0.08310650289058685, -0.07902388274669647, -0.07494126260280609, -0.07085863500833511, -0.06677600741386414, -0.06269338726997375, -0.058610763400793076, -0.054528139531612396, -0.05044551566243172, -0.04636289179325104, -0.04228026792407036, -0.03819764405488968, -0.034115020185709, -0.03003239631652832, -0.02594977244734764, -0.02186714857816696, -0.017784524708986282, -0.013701893389225006, -0.009619269520044327, -0.0055366456508636475, -0.0014540217816829681, 0.002628602087497711, 0.0067112259566783905, 0.01079384982585907, 0.01487647369503975, 0.01895909756422043, 0.023041721433401108, 0.027124345302581787, 0.031206969171762466, 0.035289593040943146, 0.039372216910123825, 0.043454840779304504, 0.047537464648485184, 0.05162008851766586, 0.05570271238684654, 0.05978533625602722, 0.0638679563999176, 0.06795058399438858, 0.07203321158885956, 0.07611583173274994, 0.08019845187664032, 0.0842810794711113, 0.08836370706558228, 0.09244632720947266, 0.09652894735336304, 0.10061157494783401, 0.10469420254230499, 0.10877682268619537, 0.11285944283008575, 0.11694207042455673]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 10.0, 5.0, 8.0, 8.0, 15.0, 14.0, 18.0, 23.0, 33.0, 28.0, 24.0, 37.0, 30.0, 30.0, 32.0, 38.0, 39.0, 35.0, 34.0, 37.0, 41.0, 30.0, 37.0, 37.0, 40.0, 41.0, 32.0, 25.0, 27.0, 24.0, 18.0, 21.0, 26.0, 14.0, 14.0, 12.0, 14.0, 15.0, 5.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102790966629982, -0.09945085644721985, -0.0961107462644577, -0.09277063608169556, -0.08943052589893341, -0.08609041571617126, -0.08275030553340912, -0.07941019535064697, -0.07607008516788483, -0.07272997498512268, -0.06938986480236053, -0.06604975461959839, -0.06270964443683624, -0.0593695342540741, -0.05602942407131195, -0.052689313888549805, -0.04934920370578766, -0.04600909352302551, -0.04266898334026337, -0.03932887315750122, -0.035988762974739075, -0.03264865279197693, -0.029308542609214783, -0.025968432426452637, -0.02262832224369049, -0.019288212060928345, -0.0159481018781662, -0.012607991695404053, -0.009267881512641907, -0.005927771329879761, -0.0025876611471176147, 0.0007524490356445312, 0.004092566668987274, 0.00743267685174942, 0.010772787034511566, 0.014112897217273712, 0.017453007400035858, 0.020793117582798004, 0.02413322776556015, 0.027473337948322296, 0.030813448131084442, 0.03415355831384659, 0.037493668496608734, 0.04083377867937088, 0.044173888862133026, 0.04751399904489517, 0.05085410922765732, 0.054194219410419464, 0.05753432959318161, 0.060874439775943756, 0.0642145499587059, 0.06755466014146805, 0.0708947703242302, 0.07423488050699234, 0.07757499068975449, 0.08091510087251663, 0.08425521105527878, 0.08759532123804092, 0.09093543142080307, 0.09427554160356522, 0.09761565178632736, 0.10095576196908951, 0.10429587215185165, 0.1076359823346138, 0.11097609251737595]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 11.0, 12.0, 14.0, 29.0, 60.0, 84.0, 140.0, 233.0, 352.0, 592.0, 895.0, 1503.0, 2386.0, 3990.0, 6737.0, 11514.0, 19862.0, 35651.0, 65264.0, 129709.0, 288313.0, 241601.0, 109426.0, 56410.0, 31122.0, 17343.0, 10143.0, 6066.0, 3471.0, 2157.0, 1304.0, 837.0, 515.0, 286.0, 194.0, 123.0, 73.0, 47.0, 36.0, 16.0, 20.0, 8.0, 2.0, 3.0, 3.0, 4.0, 2.0], "bins": [-0.30419921875, -0.2961692810058594, -0.28813934326171875, -0.2801094055175781, -0.2720794677734375, -0.2640495300292969, -0.25601959228515625, -0.24798965454101562, -0.239959716796875, -0.23192977905273438, -0.22389984130859375, -0.21586990356445312, -0.2078399658203125, -0.19981002807617188, -0.19178009033203125, -0.18375015258789062, -0.17572021484375, -0.16769027709960938, -0.15966033935546875, -0.15163040161132812, -0.1436004638671875, -0.13557052612304688, -0.12754058837890625, -0.11951065063476562, -0.111480712890625, -0.10345077514648438, -0.09542083740234375, -0.08739089965820312, -0.0793609619140625, -0.07133102416992188, -0.06330108642578125, -0.055271148681640625, -0.0472412109375, -0.039211273193359375, -0.03118133544921875, -0.023151397705078125, -0.0151214599609375, -0.007091522216796875, 0.00093841552734375, 0.008968353271484375, 0.016998291015625, 0.025028228759765625, 0.03305816650390625, 0.041088104248046875, 0.0491180419921875, 0.057147979736328125, 0.06517791748046875, 0.07320785522460938, 0.08123779296875, 0.08926773071289062, 0.09729766845703125, 0.10532760620117188, 0.1133575439453125, 0.12138748168945312, 0.12941741943359375, 0.13744735717773438, 0.145477294921875, 0.15350723266601562, 0.16153717041015625, 0.16956710815429688, 0.1775970458984375, 0.18562698364257812, 0.19365692138671875, 0.20168685913085938, 0.209716796875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 6.0, 2.0, 5.0, 8.0, 8.0, 18.0, 10.0, 19.0, 21.0, 17.0, 39.0, 29.0, 22.0, 33.0, 35.0, 39.0, 36.0, 32.0, 48.0, 39.0, 43.0, 34.0, 41.0, 36.0, 41.0, 45.0, 38.0, 37.0, 27.0, 31.0, 30.0, 15.0, 23.0, 18.0, 16.0, 9.0, 7.0, 9.0, 13.0, 9.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0987548828125, -0.09554862976074219, -0.09234237670898438, -0.08913612365722656, -0.08592987060546875, -0.08272361755371094, -0.07951736450195312, -0.07631111145019531, -0.0731048583984375, -0.06989860534667969, -0.06669235229492188, -0.06348609924316406, -0.06027984619140625, -0.05707359313964844, -0.053867340087890625, -0.05066108703613281, -0.047454833984375, -0.04424858093261719, -0.041042327880859375, -0.03783607482910156, -0.03462982177734375, -0.03142356872558594, -0.028217315673828125, -0.025011062622070312, -0.0218048095703125, -0.018598556518554688, -0.015392303466796875, -0.012186050415039062, -0.00897979736328125, -0.0057735443115234375, -0.002567291259765625, 0.0006389617919921875, 0.00384521484375, 0.0070514678955078125, 0.010257720947265625, 0.013463973999023438, 0.01667022705078125, 0.019876480102539062, 0.023082733154296875, 0.026288986206054688, 0.0294952392578125, 0.03270149230957031, 0.035907745361328125, 0.03911399841308594, 0.04232025146484375, 0.04552650451660156, 0.048732757568359375, 0.05193901062011719, 0.055145263671875, 0.05835151672363281, 0.061557769775390625, 0.06476402282714844, 0.06797027587890625, 0.07117652893066406, 0.07438278198242188, 0.07758903503417969, 0.0807952880859375, 0.08400154113769531, 0.08720779418945312, 0.09041404724121094, 0.09362030029296875, 0.09682655334472656, 0.10003280639648438, 0.10323905944824219, 0.1064453125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 15.0, 22.0, 32.0, 48.0, 73.0, 94.0, 108.0, 200.0, 265.0, 406.0, 581.0, 880.0, 1288.0, 2026.0, 3115.0, 4755.0, 7350.0, 11485.0, 18163.0, 28590.0, 46383.0, 79055.0, 142181.0, 261872.0, 185730.0, 100273.0, 57548.0, 34838.0, 21793.0, 13582.0, 8906.0, 5895.0, 3758.0, 2553.0, 1628.0, 999.0, 628.0, 424.0, 285.0, 213.0, 143.0, 104.0, 84.0, 57.0, 44.0, 28.0, 14.0, 16.0, 12.0, 0.0, 4.0, 6.0, 2.0], "bins": [-0.21826171875, -0.2119731903076172, -0.20568466186523438, -0.19939613342285156, -0.19310760498046875, -0.18681907653808594, -0.18053054809570312, -0.1742420196533203, -0.1679534912109375, -0.1616649627685547, -0.15537643432617188, -0.14908790588378906, -0.14279937744140625, -0.13651084899902344, -0.13022232055664062, -0.12393379211425781, -0.117645263671875, -0.11135673522949219, -0.10506820678710938, -0.09877967834472656, -0.09249114990234375, -0.08620262145996094, -0.07991409301757812, -0.07362556457519531, -0.0673370361328125, -0.06104850769042969, -0.054759979248046875, -0.04847145080566406, -0.04218292236328125, -0.03589439392089844, -0.029605865478515625, -0.023317337036132812, -0.01702880859375, -0.010740280151367188, -0.004451751708984375, 0.0018367767333984375, 0.00812530517578125, 0.014413833618164062, 0.020702362060546875, 0.026990890502929688, 0.0332794189453125, 0.03956794738769531, 0.045856475830078125, 0.05214500427246094, 0.05843353271484375, 0.06472206115722656, 0.07101058959960938, 0.07729911804199219, 0.083587646484375, 0.08987617492675781, 0.09616470336914062, 0.10245323181152344, 0.10874176025390625, 0.11503028869628906, 0.12131881713867188, 0.1276073455810547, 0.1338958740234375, 0.1401844024658203, 0.14647293090820312, 0.15276145935058594, 0.15904998779296875, 0.16533851623535156, 0.17162704467773438, 0.1779155731201172, 0.1842041015625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 9.0, 8.0, 8.0, 7.0, 9.0, 13.0, 14.0, 16.0, 19.0, 15.0, 20.0, 17.0, 22.0, 23.0, 33.0, 28.0, 24.0, 37.0, 38.0, 37.0, 31.0, 29.0, 37.0, 34.0, 37.0, 33.0, 31.0, 39.0, 39.0, 23.0, 27.0, 31.0, 18.0, 29.0, 29.0, 24.0, 15.0, 13.0, 16.0, 6.0, 8.0, 10.0, 6.0, 8.0, 6.0, 8.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.058349609375, -0.05663442611694336, -0.05491924285888672, -0.05320405960083008, -0.05148887634277344, -0.0497736930847168, -0.048058509826660156, -0.046343326568603516, -0.044628143310546875, -0.042912960052490234, -0.041197776794433594, -0.03948259353637695, -0.03776741027832031, -0.03605222702026367, -0.03433704376220703, -0.03262186050415039, -0.03090667724609375, -0.02919149398803711, -0.02747631072998047, -0.025761127471923828, -0.024045944213867188, -0.022330760955810547, -0.020615577697753906, -0.018900394439697266, -0.017185211181640625, -0.015470027923583984, -0.013754844665527344, -0.012039661407470703, -0.010324478149414062, -0.008609294891357422, -0.006894111633300781, -0.005178928375244141, -0.0034637451171875, -0.0017485618591308594, -3.337860107421875e-05, 0.0016818046569824219, 0.0033969879150390625, 0.005112171173095703, 0.006827354431152344, 0.008542537689208984, 0.010257720947265625, 0.011972904205322266, 0.013688087463378906, 0.015403270721435547, 0.017118453979492188, 0.018833637237548828, 0.02054882049560547, 0.02226400375366211, 0.02397918701171875, 0.02569437026977539, 0.02740955352783203, 0.029124736785888672, 0.030839920043945312, 0.03255510330200195, 0.034270286560058594, 0.035985469818115234, 0.037700653076171875, 0.039415836334228516, 0.041131019592285156, 0.0428462028503418, 0.04456138610839844, 0.04627656936645508, 0.04799175262451172, 0.04970693588256836, 0.051422119140625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 5.0, 10.0, 15.0, 14.0, 27.0, 25.0, 43.0, 63.0, 60.0, 95.0, 133.0, 186.0, 243.0, 321.0, 426.0, 523.0, 652.0, 873.0, 1205.0, 1747.0, 2897.0, 5440.0, 12526.0, 44069.0, 782210.0, 148841.0, 24675.0, 8992.0, 4091.0, 2311.0, 1488.0, 1069.0, 738.0, 571.0, 444.0, 355.0, 237.0, 230.0, 152.0, 126.0, 92.0, 76.0, 62.0, 55.0, 38.0, 26.0, 19.0, 15.0, 14.0, 11.0, 3.0, 3.0, 1.0], "bins": [-0.0234527587890625, -0.022797584533691406, -0.022142410278320312, -0.02148723602294922, -0.020832061767578125, -0.02017688751220703, -0.019521713256835938, -0.018866539001464844, -0.01821136474609375, -0.017556190490722656, -0.016901016235351562, -0.01624584197998047, -0.015590667724609375, -0.014935493469238281, -0.014280319213867188, -0.013625144958496094, -0.012969970703125, -0.012314796447753906, -0.011659622192382812, -0.011004447937011719, -0.010349273681640625, -0.009694099426269531, -0.009038925170898438, -0.008383750915527344, -0.00772857666015625, -0.007073402404785156, -0.0064182281494140625, -0.005763053894042969, -0.005107879638671875, -0.004452705383300781, -0.0037975311279296875, -0.0031423568725585938, -0.0024871826171875, -0.0018320083618164062, -0.0011768341064453125, -0.0005216598510742188, 0.000133514404296875, 0.0007886886596679688, 0.0014438629150390625, 0.0020990371704101562, 0.00275421142578125, 0.0034093856811523438, 0.0040645599365234375, 0.004719734191894531, 0.005374908447265625, 0.006030082702636719, 0.0066852569580078125, 0.007340431213378906, 0.00799560546875, 0.008650779724121094, 0.009305953979492188, 0.009961128234863281, 0.010616302490234375, 0.011271476745605469, 0.011926651000976562, 0.012581825256347656, 0.01323699951171875, 0.013892173767089844, 0.014547348022460938, 0.015202522277832031, 0.015857696533203125, 0.01651287078857422, 0.017168045043945312, 0.017823219299316406, 0.0184783935546875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 2.0, 5.0, 2.0, 0.0, 9.0, 18.0, 14.0, 25.0, 37.0, 0.0, 71.0, 89.0, 113.0, 171.0, 0.0, 133.0, 102.0, 68.0, 50.0, 0.0, 31.0, 24.0, 12.0, 7.0, 5.0, 0.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2032687664031982e-06, -1.1548399925231934e-06, -1.1064112186431885e-06, -1.0579824447631836e-06, -1.0095536708831787e-06, -9.611248970031738e-07, -9.126961231231689e-07, -8.642673492431641e-07, -8.158385753631592e-07, -7.674098014831543e-07, -7.189810276031494e-07, -6.705522537231445e-07, -6.221234798431396e-07, -5.736947059631348e-07, -5.252659320831299e-07, -4.76837158203125e-07, -4.284083843231201e-07, -3.7997961044311523e-07, -3.3155083656311035e-07, -2.8312206268310547e-07, -2.3469328880310059e-07, -1.862645149230957e-07, -1.3783574104309082e-07, -8.940696716308594e-08, -4.0978193283081055e-08, 7.450580596923828e-09, 5.587935447692871e-08, 1.043081283569336e-07, 1.5273690223693848e-07, 2.0116567611694336e-07, 2.4959444999694824e-07, 2.980232238769531e-07, 3.46451997756958e-07, 3.948807716369629e-07, 4.4330954551696777e-07, 4.917383193969727e-07, 5.401670932769775e-07, 5.885958671569824e-07, 6.370246410369873e-07, 6.854534149169922e-07, 7.338821887969971e-07, 7.82310962677002e-07, 8.307397365570068e-07, 8.791685104370117e-07, 9.275972843170166e-07, 9.760260581970215e-07, 1.0244548320770264e-06, 1.0728836059570312e-06, 1.1213123798370361e-06, 1.169741153717041e-06, 1.218169927597046e-06, 1.2665987014770508e-06, 1.3150274753570557e-06, 1.3634562492370605e-06, 1.4118850231170654e-06, 1.4603137969970703e-06, 1.5087425708770752e-06, 1.55717134475708e-06, 1.605600118637085e-06, 1.6540288925170898e-06, 1.7024576663970947e-06, 1.7508864402770996e-06, 1.7993152141571045e-06, 1.8477439880371094e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 5.0, 5.0, 8.0, 9.0, 18.0, 30.0, 39.0, 52.0, 78.0, 113.0, 155.0, 200.0, 303.0, 387.0, 536.0, 840.0, 1105.0, 1477.0, 2250.0, 3817.0, 9860.0, 51169.0, 890369.0, 62328.0, 11316.0, 4275.0, 2352.0, 1641.0, 1059.0, 749.0, 574.0, 402.0, 288.0, 225.0, 139.0, 106.0, 90.0, 45.0, 47.0, 30.0, 16.0, 21.0, 10.0, 7.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.031463623046875, -0.030525684356689453, -0.029587745666503906, -0.02864980697631836, -0.027711868286132812, -0.026773929595947266, -0.02583599090576172, -0.024898052215576172, -0.023960113525390625, -0.023022174835205078, -0.02208423614501953, -0.021146297454833984, -0.020208358764648438, -0.01927042007446289, -0.018332481384277344, -0.017394542694091797, -0.01645660400390625, -0.015518665313720703, -0.014580726623535156, -0.01364278793334961, -0.012704849243164062, -0.011766910552978516, -0.010828971862792969, -0.009891033172607422, -0.008953094482421875, -0.008015155792236328, -0.007077217102050781, -0.006139278411865234, -0.0052013397216796875, -0.004263401031494141, -0.0033254623413085938, -0.002387523651123047, -0.0014495849609375, -0.0005116462707519531, 0.00042629241943359375, 0.0013642311096191406, 0.0023021697998046875, 0.0032401084899902344, 0.004178047180175781, 0.005115985870361328, 0.006053924560546875, 0.006991863250732422, 0.007929801940917969, 0.008867740631103516, 0.009805679321289062, 0.01074361801147461, 0.011681556701660156, 0.012619495391845703, 0.01355743408203125, 0.014495372772216797, 0.015433311462402344, 0.01637125015258789, 0.017309188842773438, 0.018247127532958984, 0.01918506622314453, 0.020123004913330078, 0.021060943603515625, 0.021998882293701172, 0.02293682098388672, 0.023874759674072266, 0.024812698364257812, 0.02575063705444336, 0.026688575744628906, 0.027626514434814453, 0.028564453125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 7.0, 10.0, 33.0, 68.0, 135.0, 508.0, 115.0, 43.0, 35.0, 13.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007579803466796875, -0.007330119609832764, -0.007080435752868652, -0.006830751895904541, -0.00658106803894043, -0.006331384181976318, -0.006081700325012207, -0.005832016468048096, -0.005582332611083984, -0.005332648754119873, -0.005082964897155762, -0.00483328104019165, -0.004583597183227539, -0.004333913326263428, -0.004084229469299316, -0.003834545612335205, -0.0035848617553710938, -0.0033351778984069824, -0.003085494041442871, -0.0028358101844787598, -0.0025861263275146484, -0.002336442470550537, -0.0020867586135864258, -0.0018370747566223145, -0.0015873908996582031, -0.0013377070426940918, -0.0010880231857299805, -0.0008383393287658691, -0.0005886554718017578, -0.0003389716148376465, -8.928775787353516e-05, 0.00016039609909057617, 0.0004100799560546875, 0.0006597638130187988, 0.0009094476699829102, 0.0011591315269470215, 0.0014088153839111328, 0.0016584992408752441, 0.0019081830978393555, 0.002157866954803467, 0.002407550811767578, 0.0026572346687316895, 0.0029069185256958008, 0.003156602382659912, 0.0034062862396240234, 0.0036559700965881348, 0.003905653953552246, 0.004155337810516357, 0.004405021667480469, 0.00465470552444458, 0.004904389381408691, 0.005154073238372803, 0.005403757095336914, 0.005653440952301025, 0.005903124809265137, 0.006152808666229248, 0.006402492523193359, 0.006652176380157471, 0.006901860237121582, 0.007151544094085693, 0.007401227951049805, 0.007650911808013916, 0.007900595664978027, 0.008150279521942139, 0.00839996337890625]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 4.0, 4.0, 11.0, 8.0, 15.0, 24.0, 18.0, 27.0, 38.0, 48.0, 62.0, 84.0, 109.0, 112.0, 92.0, 67.0, 47.0, 34.0, 40.0, 34.0, 33.0, 12.0, 15.0, 4.0, 10.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15270934998989105, -0.14814087748527527, -0.14357241988182068, -0.1390039473772049, -0.1344354897737503, -0.12986701726913452, -0.12529855966567993, -0.12073008716106415, -0.11616162210702896, -0.11159315705299377, -0.10702469199895859, -0.1024562269449234, -0.09788775444030762, -0.09331929683685303, -0.08875082433223724, -0.08418235927820206, -0.07961389422416687, -0.07504542917013168, -0.0704769641160965, -0.06590849906206131, -0.061340030282735825, -0.05677156522870064, -0.05220309644937515, -0.047634631395339966, -0.04306616634130478, -0.03849770128726959, -0.033929236233234406, -0.02936076745390892, -0.024792302399873734, -0.020223837345838547, -0.01565537042915821, -0.011086903512477875, -0.006518453359603882, -0.0019499873742461205, 0.002618478611111641, 0.007186944596469402, 0.011755410581827164, 0.01632387563586235, 0.020892342552542686, 0.025460809469223022, 0.03002927452325821, 0.034597739577293396, 0.03916620463132858, 0.04373467341065407, 0.048303138464689255, 0.05287160351872444, 0.05744007229804993, 0.062008537352085114, 0.0665770024061203, 0.07114546746015549, 0.07571393251419067, 0.08028239756822586, 0.08485086262226105, 0.08941933512687683, 0.09398780018091202, 0.0985562652349472, 0.10312473028898239, 0.10769319534301758, 0.11226166039705276, 0.11683012545108795, 0.12139859795570374, 0.12596705555915833, 0.1305355280637741, 0.1351040005683899, 0.13967245817184448]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 11.0, 7.0, 7.0, 8.0, 10.0, 14.0, 11.0, 22.0, 18.0, 11.0, 19.0, 36.0, 32.0, 34.0, 37.0, 37.0, 28.0, 25.0, 34.0, 46.0, 24.0, 30.0, 29.0, 46.0, 46.0, 40.0, 44.0, 35.0, 28.0, 27.0, 30.0, 22.0, 26.0, 21.0, 17.0, 22.0, 15.0, 7.0, 9.0, 8.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.08891312032938004, -0.08587145805358887, -0.0828297883272171, -0.07978812605142593, -0.07674645632505417, -0.073704794049263, -0.07066312432289124, -0.06762146204710007, -0.0645797997713089, -0.06153813377022743, -0.058496467769145966, -0.0554548054933548, -0.05241313949227333, -0.049371473491191864, -0.0463298074901104, -0.04328814148902893, -0.040246475487947464, -0.037204809486866, -0.03416314348578453, -0.031121479347348213, -0.028079815208911896, -0.02503814920783043, -0.021996483206748962, -0.018954819068312645, -0.01591315306723118, -0.012871487997472286, -0.009829822927713394, -0.0067881569266319275, -0.0037464918568730354, -0.0007048267871141434, 0.0023368392139673233, 0.005378503352403641, 0.008420169353485107, 0.011461834423244, 0.014503499493002892, 0.017545165494084358, 0.020586829632520676, 0.023628495633602142, 0.02667016163468361, 0.029711825773119926, 0.032753489911556244, 0.03579515591263771, 0.03883682191371918, 0.041878484189510345, 0.04492015019059181, 0.04796181619167328, 0.051003482192754745, 0.05404514819383621, 0.05708681419491768, 0.060128480195999146, 0.06317014247179031, 0.06621181219816208, 0.06925347447395325, 0.07229514420032501, 0.07533680647611618, 0.07837846875190735, 0.08142013847827911, 0.08446180075407028, 0.08750347048044205, 0.09054513275623322, 0.09358680248260498, 0.09662846475839615, 0.09967012703418732, 0.10271179676055908, 0.10575345903635025]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 0.0, 5.0, 7.0, 12.0, 22.0, 25.0, 35.0, 46.0, 73.0, 99.0, 182.0, 270.0, 444.0, 623.0, 957.0, 1581.0, 2481.0, 4253.0, 6953.0, 12234.0, 22126.0, 41453.0, 83780.0, 186322.0, 610074.0, 2130353.0, 691916.0, 200985.0, 92073.0, 46263.0, 24732.0, 13738.0, 7783.0, 4605.0, 2833.0, 1703.0, 1087.0, 724.0, 465.0, 313.0, 208.0, 133.0, 106.0, 74.0, 49.0, 23.0, 24.0, 11.0, 11.0, 7.0, 4.0, 0.0, 8.0, 0.0, 0.0, 2.0], "bins": [-0.1759033203125, -0.17066001892089844, -0.16541671752929688, -0.1601734161376953, -0.15493011474609375, -0.1496868133544922, -0.14444351196289062, -0.13920021057128906, -0.1339569091796875, -0.12871360778808594, -0.12347030639648438, -0.11822700500488281, -0.11298370361328125, -0.10774040222167969, -0.10249710083007812, -0.09725379943847656, -0.092010498046875, -0.08676719665527344, -0.08152389526367188, -0.07628059387207031, -0.07103729248046875, -0.06579399108886719, -0.060550689697265625, -0.05530738830566406, -0.0500640869140625, -0.04482078552246094, -0.039577484130859375, -0.03433418273925781, -0.02909088134765625, -0.023847579956054688, -0.018604278564453125, -0.013360977172851562, -0.00811767578125, -0.0028743743896484375, 0.002368927001953125, 0.0076122283935546875, 0.01285552978515625, 0.018098831176757812, 0.023342132568359375, 0.028585433959960938, 0.0338287353515625, 0.03907203674316406, 0.044315338134765625, 0.04955863952636719, 0.05480194091796875, 0.06004524230957031, 0.06528854370117188, 0.07053184509277344, 0.075775146484375, 0.08101844787597656, 0.08626174926757812, 0.09150505065917969, 0.09674835205078125, 0.10199165344238281, 0.10723495483398438, 0.11247825622558594, 0.1177215576171875, 0.12296485900878906, 0.12820816040039062, 0.1334514617919922, 0.13869476318359375, 0.1439380645751953, 0.14918136596679688, 0.15442466735839844, 0.15966796875]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 14.0, 15.0, 10.0, 19.0, 15.0, 11.0, 18.0, 34.0, 35.0, 36.0, 28.0, 43.0, 35.0, 28.0, 28.0, 36.0, 37.0, 38.0, 28.0, 46.0, 45.0, 44.0, 43.0, 38.0, 39.0, 25.0, 30.0, 26.0, 13.0, 22.0, 20.0, 23.0, 17.0, 6.0, 5.0, 5.0, 2.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.055694580078125, -0.05386686325073242, -0.052039146423339844, -0.050211429595947266, -0.04838371276855469, -0.04655599594116211, -0.04472827911376953, -0.04290056228637695, -0.041072845458984375, -0.0392451286315918, -0.03741741180419922, -0.03558969497680664, -0.03376197814941406, -0.031934261322021484, -0.030106544494628906, -0.028278827667236328, -0.02645111083984375, -0.024623394012451172, -0.022795677185058594, -0.020967960357666016, -0.019140243530273438, -0.01731252670288086, -0.015484809875488281, -0.013657093048095703, -0.011829376220703125, -0.010001659393310547, -0.008173942565917969, -0.006346225738525391, -0.0045185089111328125, -0.0026907920837402344, -0.0008630752563476562, 0.0009646415710449219, 0.0027923583984375, 0.004620075225830078, 0.006447792053222656, 0.008275508880615234, 0.010103225708007812, 0.01193094253540039, 0.013758659362792969, 0.015586376190185547, 0.017414093017578125, 0.019241809844970703, 0.02106952667236328, 0.02289724349975586, 0.024724960327148438, 0.026552677154541016, 0.028380393981933594, 0.030208110809326172, 0.03203582763671875, 0.03386354446411133, 0.035691261291503906, 0.037518978118896484, 0.03934669494628906, 0.04117441177368164, 0.04300212860107422, 0.0448298454284668, 0.046657562255859375, 0.04848527908325195, 0.05031299591064453, 0.05214071273803711, 0.05396842956542969, 0.055796146392822266, 0.057623863220214844, 0.05945158004760742, 0.061279296875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 16.0, 20.0, 37.0, 65.0, 72.0, 102.0, 176.0, 238.0, 410.0, 596.0, 929.0, 1448.0, 2273.0, 3358.0, 5196.0, 8272.0, 13199.0, 20739.0, 34091.0, 56800.0, 98589.0, 183359.0, 370493.0, 900793.0, 1378550.0, 544421.0, 251382.0, 131360.0, 72852.0, 42876.0, 26093.0, 16431.0, 10342.0, 6665.0, 4216.0, 2623.0, 1807.0, 1184.0, 784.0, 495.0, 323.0, 214.0, 136.0, 78.0, 68.0, 42.0, 31.0, 13.0, 18.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10174560546875, -0.09868431091308594, -0.09562301635742188, -0.09256172180175781, -0.08950042724609375, -0.08643913269042969, -0.08337783813476562, -0.08031654357910156, -0.0772552490234375, -0.07419395446777344, -0.07113265991210938, -0.06807136535644531, -0.06501007080078125, -0.06194877624511719, -0.058887481689453125, -0.05582618713378906, -0.052764892578125, -0.04970359802246094, -0.046642303466796875, -0.04358100891113281, -0.04051971435546875, -0.03745841979980469, -0.034397125244140625, -0.03133583068847656, -0.0282745361328125, -0.025213241577148438, -0.022151947021484375, -0.019090652465820312, -0.01602935791015625, -0.012968063354492188, -0.009906768798828125, -0.0068454742431640625, -0.0037841796875, -0.0007228851318359375, 0.002338409423828125, 0.0053997039794921875, 0.00846099853515625, 0.011522293090820312, 0.014583587646484375, 0.017644882202148438, 0.0207061767578125, 0.023767471313476562, 0.026828765869140625, 0.029890060424804688, 0.03295135498046875, 0.03601264953613281, 0.039073944091796875, 0.04213523864746094, 0.045196533203125, 0.04825782775878906, 0.051319122314453125, 0.05438041687011719, 0.05744171142578125, 0.06050300598144531, 0.06356430053710938, 0.06662559509277344, 0.0696868896484375, 0.07274818420410156, 0.07580947875976562, 0.07887077331542969, 0.08193206787109375, 0.08499336242675781, 0.08805465698242188, 0.09111595153808594, 0.09417724609375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 4.0, 12.0, 11.0, 19.0, 33.0, 35.0, 26.0, 41.0, 34.0, 52.0, 58.0, 69.0, 105.0, 108.0, 121.0, 143.0, 194.0, 195.0, 220.0, 229.0, 279.0, 319.0, 264.0, 227.0, 195.0, 162.0, 145.0, 142.0, 102.0, 109.0, 58.0, 80.0, 60.0, 32.0, 48.0, 24.0, 23.0, 23.0, 16.0, 12.0, 9.0, 9.0, 9.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.030303955078125, -0.029330730438232422, -0.028357505798339844, -0.027384281158447266, -0.026411056518554688, -0.02543783187866211, -0.02446460723876953, -0.023491382598876953, -0.022518157958984375, -0.021544933319091797, -0.02057170867919922, -0.01959848403930664, -0.018625259399414062, -0.017652034759521484, -0.016678810119628906, -0.015705585479736328, -0.01473236083984375, -0.013759136199951172, -0.012785911560058594, -0.011812686920166016, -0.010839462280273438, -0.00986623764038086, -0.008893013000488281, -0.007919788360595703, -0.006946563720703125, -0.005973339080810547, -0.005000114440917969, -0.004026889801025391, -0.0030536651611328125, -0.0020804405212402344, -0.0011072158813476562, -0.00013399124145507812, 0.0008392333984375, 0.0018124580383300781, 0.0027856826782226562, 0.0037589073181152344, 0.0047321319580078125, 0.005705356597900391, 0.006678581237792969, 0.007651805877685547, 0.008625030517578125, 0.009598255157470703, 0.010571479797363281, 0.01154470443725586, 0.012517929077148438, 0.013491153717041016, 0.014464378356933594, 0.015437602996826172, 0.01641082763671875, 0.017384052276611328, 0.018357276916503906, 0.019330501556396484, 0.020303726196289062, 0.02127695083618164, 0.02225017547607422, 0.023223400115966797, 0.024196624755859375, 0.025169849395751953, 0.02614307403564453, 0.02711629867553711, 0.028089523315429688, 0.029062747955322266, 0.030035972595214844, 0.031009197235107422, 0.031982421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 7.0, 10.0, 12.0, 10.0, 10.0, 13.0, 23.0, 27.0, 55.0, 62.0, 58.0, 99.0, 86.0, 91.0, 78.0, 61.0, 65.0, 33.0, 35.0, 22.0, 30.0, 17.0, 12.0, 13.0, 7.0, 4.0, 7.0, 9.0, 9.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09388542175292969, -0.09097446501255035, -0.08806350827217102, -0.08515255153179169, -0.08224160224199295, -0.07933064550161362, -0.07641968876123428, -0.07350873202085495, -0.07059778273105621, -0.06768682599067688, -0.06477586925029755, -0.06186491623520851, -0.058953963220119476, -0.05604300647974014, -0.05313204973936081, -0.050221092998981476, -0.04731013625860214, -0.04439917951822281, -0.041488226503133774, -0.03857726976275444, -0.035666316747665405, -0.03275536000728607, -0.02984440326690674, -0.026933448389172554, -0.02402249351143837, -0.021111538633704185, -0.01820058375597, -0.015289627015590668, -0.012378672137856483, -0.0094677172601223, -0.006556760519742966, -0.0036458056420087814, -0.0007348582148551941, 0.0021760971285402775, 0.005087052471935749, 0.007998008280992508, 0.010908963158726692, 0.013819918036460876, 0.01673087477684021, 0.019641829654574394, 0.02255278453230858, 0.025463739410042763, 0.028374694287776947, 0.03128565102815628, 0.034196607768535614, 0.03710756078362465, 0.04001851752400398, 0.04292947053909302, 0.04584042727947235, 0.048751384019851685, 0.05166233703494072, 0.05457329377532005, 0.05748424679040909, 0.06039520353078842, 0.06330616027116776, 0.06621711701154709, 0.06912806630134583, 0.07203902304172516, 0.07494997978210449, 0.07786093652248383, 0.08077188581228256, 0.0836828425526619, 0.08659379929304123, 0.08950475603342056, 0.0924157127737999]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 1.0, 6.0, 3.0, 10.0, 14.0, 9.0, 10.0, 10.0, 15.0, 16.0, 15.0, 21.0, 24.0, 31.0, 29.0, 20.0, 27.0, 36.0, 28.0, 29.0, 49.0, 43.0, 51.0, 34.0, 38.0, 41.0, 39.0, 45.0, 33.0, 33.0, 39.0, 28.0, 25.0, 28.0, 15.0, 14.0, 16.0, 18.0, 14.0, 7.0, 11.0, 4.0, 10.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.06475847959518433, -0.06278478354215622, -0.06081108748912811, -0.058837391436100006, -0.0568636953830719, -0.05488999933004379, -0.052916303277015686, -0.05094260722398758, -0.04896891117095947, -0.046995215117931366, -0.04502151906490326, -0.04304782301187515, -0.041074126958847046, -0.03910043090581894, -0.03712673485279083, -0.035153038799762726, -0.03317933902144432, -0.031205642968416214, -0.029231946915388107, -0.02725825086236, -0.025284554809331894, -0.023310858756303787, -0.02133716084063053, -0.019363464787602425, -0.017389768734574318, -0.015416072681546211, -0.013442376628518105, -0.011468679644167423, -0.009494983591139317, -0.00752128753811121, -0.0055475905537605286, -0.003573894500732422, -0.0016001947224140167, 0.0003735015634447336, 0.002347197849303484, 0.004320894367992878, 0.006294590421020985, 0.008268286474049091, 0.010241983458399773, 0.01221567951142788, 0.014189375564455986, 0.016163071617484093, 0.0181367676705122, 0.020110465586185455, 0.022084161639213562, 0.02405785769224167, 0.026031553745269775, 0.028005249798297882, 0.02997894585132599, 0.031952641904354095, 0.0339263379573822, 0.03590003401041031, 0.037873730063438416, 0.03984742611646652, 0.04182112216949463, 0.043794818222522736, 0.04576851427555084, 0.04774221032857895, 0.049715906381607056, 0.05168960243463516, 0.05366329848766327, 0.055636994540691376, 0.05761069059371948, 0.05958438664674759, 0.061558086425065994]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 2.0, 11.0, 9.0, 14.0, 24.0, 39.0, 57.0, 78.0, 109.0, 139.0, 226.0, 308.0, 461.0, 629.0, 816.0, 1215.0, 1704.0, 2489.0, 3573.0, 5240.0, 7619.0, 11475.0, 17491.0, 27256.0, 45740.0, 79531.0, 150681.0, 268200.0, 184030.0, 94429.0, 53100.0, 30986.0, 20101.0, 12877.0, 8778.0, 5843.0, 4152.0, 2763.0, 1900.0, 1285.0, 966.0, 635.0, 468.0, 349.0, 224.0, 185.0, 119.0, 81.0, 47.0, 39.0, 23.0, 15.0, 14.0, 10.0, 5.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.03240966796875, -0.03138542175292969, -0.030361175537109375, -0.029336929321289062, -0.02831268310546875, -0.027288436889648438, -0.026264190673828125, -0.025239944458007812, -0.0242156982421875, -0.023191452026367188, -0.022167205810546875, -0.021142959594726562, -0.02011871337890625, -0.019094467163085938, -0.018070220947265625, -0.017045974731445312, -0.016021728515625, -0.014997482299804688, -0.013973236083984375, -0.012948989868164062, -0.01192474365234375, -0.010900497436523438, -0.009876251220703125, -0.008852005004882812, -0.0078277587890625, -0.0068035125732421875, -0.005779266357421875, -0.0047550201416015625, -0.00373077392578125, -0.0027065277099609375, -0.001682281494140625, -0.0006580352783203125, 0.0003662109375, 0.0013904571533203125, 0.002414703369140625, 0.0034389495849609375, 0.00446319580078125, 0.0054874420166015625, 0.006511688232421875, 0.0075359344482421875, 0.0085601806640625, 0.009584426879882812, 0.010608673095703125, 0.011632919311523438, 0.01265716552734375, 0.013681411743164062, 0.014705657958984375, 0.015729904174804688, 0.016754150390625, 0.017778396606445312, 0.018802642822265625, 0.019826889038085938, 0.02085113525390625, 0.021875381469726562, 0.022899627685546875, 0.023923873901367188, 0.0249481201171875, 0.025972366333007812, 0.026996612548828125, 0.028020858764648438, 0.02904510498046875, 0.030069351196289062, 0.031093597412109375, 0.03211784362792969, 0.03314208984375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 5.0, 5.0, 6.0, 7.0, 10.0, 18.0, 17.0, 14.0, 11.0, 22.0, 23.0, 37.0, 21.0, 23.0, 30.0, 30.0, 43.0, 39.0, 40.0, 35.0, 45.0, 44.0, 32.0, 41.0, 42.0, 41.0, 39.0, 35.0, 21.0, 28.0, 27.0, 26.0, 25.0, 17.0, 9.0, 13.0, 8.0, 11.0, 10.0, 5.0, 11.0, 5.0, 9.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05560302734375, -0.053694725036621094, -0.05178642272949219, -0.04987812042236328, -0.047969818115234375, -0.04606151580810547, -0.04415321350097656, -0.042244911193847656, -0.04033660888671875, -0.038428306579589844, -0.03652000427246094, -0.03461170196533203, -0.032703399658203125, -0.03079509735107422, -0.028886795043945312, -0.026978492736816406, -0.0250701904296875, -0.023161888122558594, -0.021253585815429688, -0.01934528350830078, -0.017436981201171875, -0.015528678894042969, -0.013620376586914062, -0.011712074279785156, -0.00980377197265625, -0.007895469665527344, -0.0059871673583984375, -0.004078865051269531, -0.002170562744140625, -0.00026226043701171875, 0.0016460418701171875, 0.0035543441772460938, 0.005462646484375, 0.007370948791503906, 0.009279251098632812, 0.011187553405761719, 0.013095855712890625, 0.015004158020019531, 0.016912460327148438, 0.018820762634277344, 0.02072906494140625, 0.022637367248535156, 0.024545669555664062, 0.02645397186279297, 0.028362274169921875, 0.03027057647705078, 0.03217887878417969, 0.034087181091308594, 0.0359954833984375, 0.037903785705566406, 0.03981208801269531, 0.04172039031982422, 0.043628692626953125, 0.04553699493408203, 0.04744529724121094, 0.049353599548339844, 0.05126190185546875, 0.053170204162597656, 0.05507850646972656, 0.05698680877685547, 0.058895111083984375, 0.06080341339111328, 0.06271171569824219, 0.0646200180053711, 0.0665283203125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 8.0, 11.0, 17.0, 27.0, 44.0, 72.0, 96.0, 128.0, 187.0, 290.0, 444.0, 654.0, 900.0, 1335.0, 2040.0, 3183.0, 5406.0, 9621.0, 19332.0, 51723.0, 223479.0, 557673.0, 106644.0, 32102.0, 13641.0, 7397.0, 4242.0, 2689.0, 1676.0, 1115.0, 782.0, 512.0, 324.0, 236.0, 142.0, 105.0, 63.0, 58.0, 47.0, 39.0, 16.0, 20.0, 10.0, 4.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07904052734375, -0.07673454284667969, -0.07442855834960938, -0.07212257385253906, -0.06981658935546875, -0.06751060485839844, -0.06520462036132812, -0.06289863586425781, -0.0605926513671875, -0.05828666687011719, -0.055980682373046875, -0.05367469787597656, -0.05136871337890625, -0.04906272888183594, -0.046756744384765625, -0.04445075988769531, -0.042144775390625, -0.03983879089355469, -0.037532806396484375, -0.03522682189941406, -0.03292083740234375, -0.030614852905273438, -0.028308868408203125, -0.026002883911132812, -0.0236968994140625, -0.021390914916992188, -0.019084930419921875, -0.016778945922851562, -0.01447296142578125, -0.012166976928710938, -0.009860992431640625, -0.0075550079345703125, -0.0052490234375, -0.0029430389404296875, -0.000637054443359375, 0.0016689300537109375, 0.00397491455078125, 0.0062808990478515625, 0.008586883544921875, 0.010892868041992188, 0.0131988525390625, 0.015504837036132812, 0.017810821533203125, 0.020116806030273438, 0.02242279052734375, 0.024728775024414062, 0.027034759521484375, 0.029340744018554688, 0.031646728515625, 0.03395271301269531, 0.036258697509765625, 0.03856468200683594, 0.04087066650390625, 0.04317665100097656, 0.045482635498046875, 0.04778861999511719, 0.0500946044921875, 0.05240058898925781, 0.054706573486328125, 0.05701255798339844, 0.05931854248046875, 0.06162452697753906, 0.06393051147460938, 0.06623649597167969, 0.06854248046875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 5.0, 2.0, 3.0, 5.0, 8.0, 5.0, 22.0, 10.0, 17.0, 20.0, 30.0, 23.0, 42.0, 28.0, 32.0, 28.0, 46.0, 52.0, 50.0, 63.0, 56.0, 56.0, 45.0, 45.0, 44.0, 47.0, 35.0, 20.0, 32.0, 30.0, 16.0, 25.0, 19.0, 8.0, 13.0, 7.0, 6.0, 7.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03997802734375, -0.038457393646240234, -0.03693675994873047, -0.0354161262512207, -0.03389549255371094, -0.03237485885620117, -0.030854225158691406, -0.02933359146118164, -0.027812957763671875, -0.02629232406616211, -0.024771690368652344, -0.023251056671142578, -0.021730422973632812, -0.020209789276123047, -0.01868915557861328, -0.017168521881103516, -0.01564788818359375, -0.014127254486083984, -0.012606620788574219, -0.011085987091064453, -0.009565353393554688, -0.008044719696044922, -0.006524085998535156, -0.005003452301025391, -0.003482818603515625, -0.0019621849060058594, -0.00044155120849609375, 0.0010790824890136719, 0.0025997161865234375, 0.004120349884033203, 0.005640983581542969, 0.007161617279052734, 0.0086822509765625, 0.010202884674072266, 0.011723518371582031, 0.013244152069091797, 0.014764785766601562, 0.016285419464111328, 0.017806053161621094, 0.01932668685913086, 0.020847320556640625, 0.02236795425415039, 0.023888587951660156, 0.025409221649169922, 0.026929855346679688, 0.028450489044189453, 0.02997112274169922, 0.031491756439208984, 0.03301239013671875, 0.034533023834228516, 0.03605365753173828, 0.03757429122924805, 0.03909492492675781, 0.04061555862426758, 0.042136192321777344, 0.04365682601928711, 0.045177459716796875, 0.04669809341430664, 0.048218727111816406, 0.04973936080932617, 0.05125999450683594, 0.0527806282043457, 0.05430126190185547, 0.055821895599365234, 0.057342529296875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 7.0, 19.0, 17.0, 19.0, 27.0, 48.0, 62.0, 54.0, 95.0, 115.0, 164.0, 209.0, 328.0, 473.0, 703.0, 1081.0, 1772.0, 2980.0, 5105.0, 9885.0, 22227.0, 68132.0, 561108.0, 285998.0, 49840.0, 17992.0, 8249.0, 4427.0, 2606.0, 1607.0, 1043.0, 668.0, 424.0, 293.0, 226.0, 151.0, 111.0, 69.0, 60.0, 39.0, 32.0, 25.0, 12.0, 7.0, 10.0, 11.0, 6.0, 2.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.006580352783203125, -0.0063672661781311035, -0.006154179573059082, -0.0059410929679870605, -0.005728006362915039, -0.005514919757843018, -0.005301833152770996, -0.005088746547698975, -0.004875659942626953, -0.004662573337554932, -0.00444948673248291, -0.004236400127410889, -0.004023313522338867, -0.0038102269172668457, -0.0035971403121948242, -0.0033840537071228027, -0.0031709671020507812, -0.0029578804969787598, -0.0027447938919067383, -0.002531707286834717, -0.0023186206817626953, -0.002105534076690674, -0.0018924474716186523, -0.0016793608665466309, -0.0014662742614746094, -0.0012531876564025879, -0.0010401010513305664, -0.0008270144462585449, -0.0006139278411865234, -0.00040084123611450195, -0.00018775463104248047, 2.5331974029541016e-05, 0.0002384185791015625, 0.000451505184173584, 0.0006645917892456055, 0.000877678394317627, 0.0010907649993896484, 0.00130385160446167, 0.0015169382095336914, 0.0017300248146057129, 0.0019431114196777344, 0.002156198024749756, 0.0023692846298217773, 0.002582371234893799, 0.0027954578399658203, 0.003008544445037842, 0.0032216310501098633, 0.0034347176551818848, 0.0036478042602539062, 0.0038608908653259277, 0.004073977470397949, 0.004287064075469971, 0.004500150680541992, 0.004713237285614014, 0.004926323890686035, 0.005139410495758057, 0.005352497100830078, 0.0055655837059021, 0.005778670310974121, 0.005991756916046143, 0.006204843521118164, 0.0064179301261901855, 0.006631016731262207, 0.0068441033363342285, 0.00705718994140625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 0.0, 3.0, 6.0, 0.0, 13.0, 0.0, 24.0, 0.0, 19.0, 48.0, 0.0, 53.0, 0.0, 68.0, 0.0, 95.0, 0.0, 106.0, 136.0, 0.0, 107.0, 0.0, 94.0, 0.0, 71.0, 55.0, 0.0, 45.0, 0.0, 18.0, 0.0, 13.0, 0.0, 12.0, 11.0, 0.0, 5.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1324882507324219e-06, -1.0989606380462646e-06, -1.0654330253601074e-06, -1.0319054126739502e-06, -9.98377799987793e-07, -9.648501873016357e-07, -9.313225746154785e-07, -8.977949619293213e-07, -8.642673492431641e-07, -8.307397365570068e-07, -7.972121238708496e-07, -7.636845111846924e-07, -7.301568984985352e-07, -6.966292858123779e-07, -6.631016731262207e-07, -6.295740604400635e-07, -5.960464477539062e-07, -5.62518835067749e-07, -5.289912223815918e-07, -4.954636096954346e-07, -4.6193599700927734e-07, -4.284083843231201e-07, -3.948807716369629e-07, -3.6135315895080566e-07, -3.2782554626464844e-07, -2.942979335784912e-07, -2.60770320892334e-07, -2.2724270820617676e-07, -1.9371509552001953e-07, -1.601874828338623e-07, -1.2665987014770508e-07, -9.313225746154785e-08, -5.960464477539063e-08, -2.60770320892334e-08, 7.450580596923828e-09, 4.0978193283081055e-08, 7.450580596923828e-08, 1.0803341865539551e-07, 1.4156103134155273e-07, 1.7508864402770996e-07, 2.086162567138672e-07, 2.421438694000244e-07, 2.7567148208618164e-07, 3.0919909477233887e-07, 3.427267074584961e-07, 3.762543201446533e-07, 4.0978193283081055e-07, 4.4330954551696777e-07, 4.76837158203125e-07, 5.103647708892822e-07, 5.438923835754395e-07, 5.774199962615967e-07, 6.109476089477539e-07, 6.444752216339111e-07, 6.780028343200684e-07, 7.115304470062256e-07, 7.450580596923828e-07, 7.7858567237854e-07, 8.121132850646973e-07, 8.456408977508545e-07, 8.791685104370117e-07, 9.126961231231689e-07, 9.462237358093262e-07, 9.797513484954834e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 14.0, 10.0, 25.0, 33.0, 26.0, 52.0, 61.0, 99.0, 109.0, 176.0, 254.0, 376.0, 591.0, 864.0, 1591.0, 2702.0, 5327.0, 10866.0, 23847.0, 64408.0, 246614.0, 507924.0, 113553.0, 37033.0, 15487.0, 7358.0, 3712.0, 2043.0, 1170.0, 717.0, 438.0, 336.0, 210.0, 143.0, 90.0, 75.0, 54.0, 41.0, 39.0, 18.0, 13.0, 14.0, 8.0, 7.0, 8.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005687713623046875, -0.0054931640625, -0.005298614501953125, -0.00510406494140625, -0.004909515380859375, -0.0047149658203125, -0.004520416259765625, -0.00432586669921875, -0.004131317138671875, -0.003936767578125, -0.003742218017578125, -0.00354766845703125, -0.003353118896484375, -0.0031585693359375, -0.002964019775390625, -0.00276947021484375, -0.002574920654296875, -0.00238037109375, -0.002185821533203125, -0.00199127197265625, -0.001796722412109375, -0.0016021728515625, -0.001407623291015625, -0.00121307373046875, -0.001018524169921875, -0.000823974609375, -0.000629425048828125, -0.00043487548828125, -0.000240325927734375, -4.57763671875e-05, 0.000148773193359375, 0.00034332275390625, 0.000537872314453125, 0.000732421875, 0.000926971435546875, 0.00112152099609375, 0.001316070556640625, 0.0015106201171875, 0.001705169677734375, 0.00189971923828125, 0.002094268798828125, 0.002288818359375, 0.002483367919921875, 0.00267791748046875, 0.002872467041015625, 0.0030670166015625, 0.003261566162109375, 0.00345611572265625, 0.003650665283203125, 0.00384521484375, 0.004039764404296875, 0.00423431396484375, 0.004428863525390625, 0.0046234130859375, 0.004817962646484375, 0.00501251220703125, 0.005207061767578125, 0.005401611328125, 0.005596160888671875, 0.00579071044921875, 0.005985260009765625, 0.0061798095703125, 0.006374359130859375, 0.00656890869140625, 0.006763458251953125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 0.0, 6.0, 5.0, 7.0, 5.0, 6.0, 8.0, 10.0, 14.0, 22.0, 28.0, 40.0, 60.0, 110.0, 173.0, 191.0, 104.0, 62.0, 30.0, 34.0, 23.0, 15.0, 13.0, 8.0, 10.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0026264190673828125, -0.0025535225868225098, -0.002480626106262207, -0.0024077296257019043, -0.0023348331451416016, -0.002261936664581299, -0.002189040184020996, -0.0021161437034606934, -0.0020432472229003906, -0.001970350742340088, -0.0018974542617797852, -0.0018245577812194824, -0.0017516613006591797, -0.001678764820098877, -0.0016058683395385742, -0.0015329718589782715, -0.0014600753784179688, -0.001387178897857666, -0.0013142824172973633, -0.0012413859367370605, -0.0011684894561767578, -0.001095592975616455, -0.0010226964950561523, -0.0009498000144958496, -0.0008769035339355469, -0.0008040070533752441, -0.0007311105728149414, -0.0006582140922546387, -0.0005853176116943359, -0.0005124211311340332, -0.00043952465057373047, -0.00036662817001342773, -0.000293731689453125, -0.00022083520889282227, -0.00014793872833251953, -7.50422477722168e-05, -2.1457672119140625e-06, 7.075071334838867e-05, 0.0001436471939086914, 0.00021654367446899414, 0.0002894401550292969, 0.0003623366355895996, 0.00043523311614990234, 0.0005081295967102051, 0.0005810260772705078, 0.0006539225578308105, 0.0007268190383911133, 0.000799715518951416, 0.0008726119995117188, 0.0009455084800720215, 0.0010184049606323242, 0.001091301441192627, 0.0011641979217529297, 0.0012370944023132324, 0.0013099908828735352, 0.0013828873634338379, 0.0014557838439941406, 0.0015286803245544434, 0.001601576805114746, 0.0016744732856750488, 0.0017473697662353516, 0.0018202662467956543, 0.001893162727355957, 0.0019660592079162598, 0.0020389556884765625]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 6.0, 11.0, 12.0, 13.0, 6.0, 14.0, 12.0, 36.0, 39.0, 55.0, 57.0, 93.0, 97.0, 87.0, 89.0, 75.0, 59.0, 42.0, 26.0, 24.0, 29.0, 23.0, 10.0, 9.0, 14.0, 6.0, 5.0, 8.0, 10.0, 6.0, 0.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0939144715666771, -0.09102220088243484, -0.0881299301981926, -0.08523765951395035, -0.0823453888297081, -0.07945311814546585, -0.0765608549118042, -0.07366858422756195, -0.0707763135433197, -0.06788404285907745, -0.0649917721748352, -0.06209950149059296, -0.05920723080635071, -0.05631496012210846, -0.05342269316315651, -0.05053042247891426, -0.047638148069381714, -0.044745877385139465, -0.04185360670089722, -0.03896133601665497, -0.03606906533241272, -0.03317679464817047, -0.03028452768921852, -0.027392257004976273, -0.024499986320734024, -0.021607715636491776, -0.018715444952249527, -0.015823176130652428, -0.01293090544641018, -0.01003863476216793, -0.007146365940570831, -0.004254095256328583, -0.0013618171215057373, 0.001530453097075224, 0.004422723315656185, 0.007314993068575859, 0.010207263752818108, 0.013099534437060356, 0.015991803258657455, 0.018884073942899704, 0.021776344627141953, 0.0246686153113842, 0.02756088599562645, 0.03045315481722355, 0.03334542363882065, 0.0362376943230629, 0.039129965007305145, 0.042022235691547394, 0.04491450637578964, 0.04780677706003189, 0.05069904774427414, 0.05359131842851639, 0.056483589112758636, 0.059375859797000885, 0.062268126755952835, 0.06516039371490479, 0.06805266439914703, 0.07094493508338928, 0.07383720576763153, 0.07672947645187378, 0.07962174713611603, 0.08251401782035828, 0.08540628850460052, 0.08829855918884277, 0.09119082987308502]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 10.0, 15.0, 11.0, 8.0, 10.0, 17.0, 15.0, 11.0, 22.0, 24.0, 32.0, 32.0, 20.0, 25.0, 32.0, 31.0, 32.0, 43.0, 43.0, 54.0, 36.0, 36.0, 41.0, 38.0, 43.0, 34.0, 34.0, 39.0, 28.0, 25.0, 29.0, 18.0, 13.0, 17.0, 16.0, 16.0, 7.0, 11.0, 4.0, 9.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.06502582132816315, -0.06305941194295883, -0.06109299883246422, -0.059126585721969604, -0.05716017633676529, -0.055193766951560974, -0.05322735384106636, -0.05126094073057175, -0.04929453134536743, -0.047328121960163116, -0.0453617088496685, -0.04339529573917389, -0.041428886353969574, -0.03946247696876526, -0.037496063858270645, -0.03552965074777603, -0.033563241362571716, -0.0315968319773674, -0.029630418866872787, -0.027664007619023323, -0.02569759637117386, -0.023731185123324394, -0.02176477387547493, -0.019798362627625465, -0.017831951379776, -0.015865540131926537, -0.013899128884077072, -0.011932717636227608, -0.009966306388378143, -0.007999895140528679, -0.0060334838926792145, -0.00406707264482975, -0.0021006539463996887, -0.0001342426985502243, 0.0018321685492992401, 0.0037985797971487045, 0.005764991044998169, 0.007731402292847633, 0.009697813540697098, 0.011664224788546562, 0.013630636036396027, 0.015597047284245491, 0.017563458532094955, 0.01952986977994442, 0.021496281027793884, 0.02346269227564335, 0.025429103523492813, 0.027395514771342278, 0.029361926019191742, 0.03132833540439606, 0.03329474851489067, 0.035261161625385284, 0.0372275710105896, 0.039193980395793915, 0.04116039350628853, 0.04312680661678314, 0.04509321600198746, 0.04705962538719177, 0.049026038497686386, 0.050992451608181, 0.052958860993385315, 0.05492527037858963, 0.056891683489084244, 0.05885809659957886, 0.06082450598478317]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 8.0, 3.0, 15.0, 16.0, 40.0, 47.0, 66.0, 95.0, 140.0, 215.0, 373.0, 518.0, 754.0, 1190.0, 1808.0, 2700.0, 4093.0, 6289.0, 9575.0, 15025.0, 23796.0, 40079.0, 71613.0, 142722.0, 297263.0, 203320.0, 94785.0, 50781.0, 29452.0, 18044.0, 11723.0, 7334.0, 5021.0, 3293.0, 2166.0, 1382.0, 975.0, 615.0, 425.0, 260.0, 183.0, 114.0, 82.0, 46.0, 34.0, 27.0, 17.0, 12.0, 8.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1287841796875, -0.12472343444824219, -0.12066268920898438, -0.11660194396972656, -0.11254119873046875, -0.10848045349121094, -0.10441970825195312, -0.10035896301269531, -0.0962982177734375, -0.09223747253417969, -0.08817672729492188, -0.08411598205566406, -0.08005523681640625, -0.07599449157714844, -0.07193374633789062, -0.06787300109863281, -0.063812255859375, -0.05975151062011719, -0.055690765380859375, -0.05163002014160156, -0.04756927490234375, -0.04350852966308594, -0.039447784423828125, -0.03538703918457031, -0.0313262939453125, -0.027265548706054688, -0.023204803466796875, -0.019144058227539062, -0.01508331298828125, -0.011022567749023438, -0.006961822509765625, -0.0029010772705078125, 0.00115966796875, 0.0052204132080078125, 0.009281158447265625, 0.013341903686523438, 0.01740264892578125, 0.021463394165039062, 0.025524139404296875, 0.029584884643554688, 0.0336456298828125, 0.03770637512207031, 0.041767120361328125, 0.04582786560058594, 0.04988861083984375, 0.05394935607910156, 0.058010101318359375, 0.06207084655761719, 0.066131591796875, 0.07019233703613281, 0.07425308227539062, 0.07831382751464844, 0.08237457275390625, 0.08643531799316406, 0.09049606323242188, 0.09455680847167969, 0.0986175537109375, 0.10267829895019531, 0.10673904418945312, 0.11079978942871094, 0.11486053466796875, 0.11892127990722656, 0.12298202514648438, 0.1270427703857422, 0.131103515625]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 10.0, 10.0, 7.0, 6.0, 5.0, 10.0, 19.0, 14.0, 15.0, 13.0, 24.0, 26.0, 22.0, 19.0, 33.0, 33.0, 28.0, 37.0, 42.0, 42.0, 51.0, 41.0, 35.0, 45.0, 42.0, 39.0, 42.0, 34.0, 44.0, 26.0, 27.0, 22.0, 19.0, 14.0, 21.0, 11.0, 15.0, 12.0, 5.0, 9.0, 11.0, 3.0, 10.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050872802734375, -0.04914999008178711, -0.04742717742919922, -0.04570436477661133, -0.04398155212402344, -0.04225873947143555, -0.040535926818847656, -0.038813114166259766, -0.037090301513671875, -0.035367488861083984, -0.033644676208496094, -0.0319218635559082, -0.030199050903320312, -0.028476238250732422, -0.02675342559814453, -0.02503061294555664, -0.02330780029296875, -0.02158498764038086, -0.01986217498779297, -0.018139362335205078, -0.016416549682617188, -0.014693737030029297, -0.012970924377441406, -0.011248111724853516, -0.009525299072265625, -0.007802486419677734, -0.006079673767089844, -0.004356861114501953, -0.0026340484619140625, -0.0009112358093261719, 0.0008115768432617188, 0.0025343894958496094, 0.0042572021484375, 0.005980014801025391, 0.007702827453613281, 0.009425640106201172, 0.011148452758789062, 0.012871265411376953, 0.014594078063964844, 0.016316890716552734, 0.018039703369140625, 0.019762516021728516, 0.021485328674316406, 0.023208141326904297, 0.024930953979492188, 0.026653766632080078, 0.02837657928466797, 0.03009939193725586, 0.03182220458984375, 0.03354501724243164, 0.03526782989501953, 0.03699064254760742, 0.03871345520019531, 0.0404362678527832, 0.042159080505371094, 0.043881893157958984, 0.045604705810546875, 0.047327518463134766, 0.049050331115722656, 0.05077314376831055, 0.05249595642089844, 0.05421876907348633, 0.05594158172607422, 0.05766439437866211, 0.05938720703125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 8.0, 10.0, 15.0, 20.0, 34.0, 48.0, 89.0, 112.0, 183.0, 243.0, 418.0, 600.0, 841.0, 1285.0, 1859.0, 2781.0, 4077.0, 6158.0, 9395.0, 14085.0, 21798.0, 34321.0, 54260.0, 90104.0, 158210.0, 260659.0, 151875.0, 87030.0, 52957.0, 32950.0, 21179.0, 13634.0, 8925.0, 5886.0, 4107.0, 2747.0, 1813.0, 1216.0, 823.0, 581.0, 383.0, 287.0, 191.0, 128.0, 79.0, 50.0, 35.0, 28.0, 20.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.11944580078125, -0.11598014831542969, -0.11251449584960938, -0.10904884338378906, -0.10558319091796875, -0.10211753845214844, -0.09865188598632812, -0.09518623352050781, -0.0917205810546875, -0.08825492858886719, -0.08478927612304688, -0.08132362365722656, -0.07785797119140625, -0.07439231872558594, -0.07092666625976562, -0.06746101379394531, -0.063995361328125, -0.06052970886230469, -0.057064056396484375, -0.05359840393066406, -0.05013275146484375, -0.04666709899902344, -0.043201446533203125, -0.03973579406738281, -0.0362701416015625, -0.03280448913574219, -0.029338836669921875, -0.025873184204101562, -0.02240753173828125, -0.018941879272460938, -0.015476226806640625, -0.012010574340820312, -0.008544921875, -0.0050792694091796875, -0.001613616943359375, 0.0018520355224609375, 0.00531768798828125, 0.008783340454101562, 0.012248992919921875, 0.015714645385742188, 0.0191802978515625, 0.022645950317382812, 0.026111602783203125, 0.029577255249023438, 0.03304290771484375, 0.03650856018066406, 0.039974212646484375, 0.04343986511230469, 0.046905517578125, 0.05037117004394531, 0.053836822509765625, 0.05730247497558594, 0.06076812744140625, 0.06423377990722656, 0.06769943237304688, 0.07116508483886719, 0.0746307373046875, 0.07809638977050781, 0.08156204223632812, 0.08502769470214844, 0.08849334716796875, 0.09195899963378906, 0.09542465209960938, 0.09889030456542969, 0.10235595703125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 4.0, 3.0, 6.0, 7.0, 10.0, 13.0, 11.0, 17.0, 19.0, 27.0, 19.0, 21.0, 29.0, 35.0, 32.0, 28.0, 23.0, 38.0, 36.0, 40.0, 36.0, 50.0, 33.0, 35.0, 40.0, 29.0, 37.0, 41.0, 29.0, 35.0, 45.0, 22.0, 28.0, 18.0, 13.0, 21.0, 11.0, 11.0, 8.0, 8.0, 6.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.033599853515625, -0.032501220703125, -0.031402587890625, -0.030303955078125, -0.029205322265625, -0.028106689453125, -0.027008056640625, -0.025909423828125, -0.024810791015625, -0.023712158203125, -0.022613525390625, -0.021514892578125, -0.020416259765625, -0.019317626953125, -0.018218994140625, -0.017120361328125, -0.016021728515625, -0.014923095703125, -0.013824462890625, -0.012725830078125, -0.011627197265625, -0.010528564453125, -0.009429931640625, -0.008331298828125, -0.007232666015625, -0.006134033203125, -0.005035400390625, -0.003936767578125, -0.002838134765625, -0.001739501953125, -0.000640869140625, 0.000457763671875, 0.001556396484375, 0.002655029296875, 0.003753662109375, 0.004852294921875, 0.005950927734375, 0.007049560546875, 0.008148193359375, 0.009246826171875, 0.010345458984375, 0.011444091796875, 0.012542724609375, 0.013641357421875, 0.014739990234375, 0.015838623046875, 0.016937255859375, 0.018035888671875, 0.019134521484375, 0.020233154296875, 0.021331787109375, 0.022430419921875, 0.023529052734375, 0.024627685546875, 0.025726318359375, 0.026824951171875, 0.027923583984375, 0.029022216796875, 0.030120849609375, 0.031219482421875, 0.032318115234375, 0.033416748046875, 0.034515380859375, 0.035614013671875, 0.036712646484375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 1.0, 6.0, 9.0, 6.0, 11.0, 12.0, 17.0, 27.0, 43.0, 49.0, 55.0, 85.0, 99.0, 130.0, 176.0, 218.0, 291.0, 379.0, 502.0, 645.0, 926.0, 1262.0, 1660.0, 2272.0, 3306.0, 5139.0, 13133.0, 964196.0, 33424.0, 6694.0, 3811.0, 2647.0, 1924.0, 1383.0, 1004.0, 715.0, 530.0, 408.0, 322.0, 242.0, 171.0, 141.0, 127.0, 89.0, 76.0, 41.0, 45.0, 28.0, 18.0, 16.0, 15.0, 9.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.035400390625, -0.03428316116333008, -0.033165931701660156, -0.032048702239990234, -0.030931472778320312, -0.02981424331665039, -0.02869701385498047, -0.027579784393310547, -0.026462554931640625, -0.025345325469970703, -0.02422809600830078, -0.02311086654663086, -0.021993637084960938, -0.020876407623291016, -0.019759178161621094, -0.018641948699951172, -0.01752471923828125, -0.016407489776611328, -0.015290260314941406, -0.014173030853271484, -0.013055801391601562, -0.01193857192993164, -0.010821342468261719, -0.009704113006591797, -0.008586883544921875, -0.007469654083251953, -0.006352424621582031, -0.005235195159912109, -0.0041179656982421875, -0.0030007362365722656, -0.0018835067749023438, -0.0007662773132324219, 0.0003509521484375, 0.0014681816101074219, 0.0025854110717773438, 0.0037026405334472656, 0.0048198699951171875, 0.005937099456787109, 0.007054328918457031, 0.008171558380126953, 0.009288787841796875, 0.010406017303466797, 0.011523246765136719, 0.01264047622680664, 0.013757705688476562, 0.014874935150146484, 0.015992164611816406, 0.017109394073486328, 0.01822662353515625, 0.019343852996826172, 0.020461082458496094, 0.021578311920166016, 0.022695541381835938, 0.02381277084350586, 0.02493000030517578, 0.026047229766845703, 0.027164459228515625, 0.028281688690185547, 0.02939891815185547, 0.03051614761352539, 0.03163337707519531, 0.032750606536865234, 0.033867835998535156, 0.03498506546020508, 0.036102294921875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 7.0, 5.0, 14.0, 20.0, 64.0, 67.0, 107.0, 138.0, 164.0, 0.0, 155.0, 91.0, 77.0, 43.0, 17.0, 13.0, 11.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6149133443832397e-06, -1.560896635055542e-06, -1.5068799257278442e-06, -1.4528632164001465e-06, -1.3988465070724487e-06, -1.344829797744751e-06, -1.2908130884170532e-06, -1.2367963790893555e-06, -1.1827796697616577e-06, -1.12876296043396e-06, -1.0747462511062622e-06, -1.0207295417785645e-06, -9.667128324508667e-07, -9.126961231231689e-07, -8.586794137954712e-07, -8.046627044677734e-07, -7.506459951400757e-07, -6.966292858123779e-07, -6.426125764846802e-07, -5.885958671569824e-07, -5.345791578292847e-07, -4.805624485015869e-07, -4.2654573917388916e-07, -3.725290298461914e-07, -3.1851232051849365e-07, -2.644956111907959e-07, -2.1047890186309814e-07, -1.564621925354004e-07, -1.0244548320770264e-07, -4.842877388000488e-08, 5.587935447692871e-09, 5.960464477539063e-08, 1.1362135410308838e-07, 1.6763806343078613e-07, 2.2165477275848389e-07, 2.7567148208618164e-07, 3.296881914138794e-07, 3.8370490074157715e-07, 4.377216100692749e-07, 4.917383193969727e-07, 5.457550287246704e-07, 5.997717380523682e-07, 6.537884473800659e-07, 7.078051567077637e-07, 7.618218660354614e-07, 8.158385753631592e-07, 8.698552846908569e-07, 9.238719940185547e-07, 9.778887033462524e-07, 1.0319054126739502e-06, 1.085922122001648e-06, 1.1399388313293457e-06, 1.1939555406570435e-06, 1.2479722499847412e-06, 1.301988959312439e-06, 1.3560056686401367e-06, 1.4100223779678345e-06, 1.4640390872955322e-06, 1.51805579662323e-06, 1.5720725059509277e-06, 1.6260892152786255e-06, 1.6801059246063232e-06, 1.734122633934021e-06, 1.7881393432617188e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 10.0, 12.0, 14.0, 15.0, 22.0, 23.0, 55.0, 74.0, 123.0, 130.0, 218.0, 350.0, 476.0, 639.0, 896.0, 1262.0, 1842.0, 2666.0, 4289.0, 9835.0, 950893.0, 56524.0, 6747.0, 3575.0, 2345.0, 1594.0, 1192.0, 820.0, 570.0, 396.0, 278.0, 191.0, 141.0, 108.0, 72.0, 51.0, 27.0, 27.0, 15.0, 9.0, 14.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.040863037109375, -0.039537906646728516, -0.03821277618408203, -0.03688764572143555, -0.03556251525878906, -0.03423738479614258, -0.032912254333496094, -0.03158712387084961, -0.030261993408203125, -0.02893686294555664, -0.027611732482910156, -0.026286602020263672, -0.024961471557617188, -0.023636341094970703, -0.02231121063232422, -0.020986080169677734, -0.01966094970703125, -0.018335819244384766, -0.01701068878173828, -0.015685558319091797, -0.014360427856445312, -0.013035297393798828, -0.011710166931152344, -0.01038503646850586, -0.009059906005859375, -0.007734775543212891, -0.006409645080566406, -0.005084514617919922, -0.0037593841552734375, -0.002434253692626953, -0.0011091232299804688, 0.00021600723266601562, 0.0015411376953125, 0.0028662681579589844, 0.004191398620605469, 0.005516529083251953, 0.0068416595458984375, 0.008166790008544922, 0.009491920471191406, 0.01081705093383789, 0.012142181396484375, 0.01346731185913086, 0.014792442321777344, 0.016117572784423828, 0.017442703247070312, 0.018767833709716797, 0.02009296417236328, 0.021418094635009766, 0.02274322509765625, 0.024068355560302734, 0.02539348602294922, 0.026718616485595703, 0.028043746948242188, 0.029368877410888672, 0.030694007873535156, 0.03201913833618164, 0.033344268798828125, 0.03466939926147461, 0.035994529724121094, 0.03731966018676758, 0.03864479064941406, 0.03996992111206055, 0.04129505157470703, 0.042620182037353516, 0.0439453125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 12.0, 34.0, 607.0, 287.0, 18.0, 10.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01183319091796875, -0.011484622955322266, -0.011136054992675781, -0.010787487030029297, -0.010438919067382812, -0.010090351104736328, -0.009741783142089844, -0.00939321517944336, -0.009044647216796875, -0.00869607925415039, -0.008347511291503906, -0.007998943328857422, -0.0076503753662109375, -0.007301807403564453, -0.006953239440917969, -0.006604671478271484, -0.006256103515625, -0.005907535552978516, -0.005558967590332031, -0.005210399627685547, -0.0048618316650390625, -0.004513263702392578, -0.004164695739746094, -0.0038161277770996094, -0.003467559814453125, -0.0031189918518066406, -0.0027704238891601562, -0.002421855926513672, -0.0020732879638671875, -0.0017247200012207031, -0.0013761520385742188, -0.0010275840759277344, -0.00067901611328125, -0.0003304481506347656, 1.811981201171875e-05, 0.0003666877746582031, 0.0007152557373046875, 0.0010638236999511719, 0.0014123916625976562, 0.0017609596252441406, 0.002109527587890625, 0.0024580955505371094, 0.0028066635131835938, 0.003155231475830078, 0.0035037994384765625, 0.003852367401123047, 0.004200935363769531, 0.004549503326416016, 0.0048980712890625, 0.005246639251708984, 0.005595207214355469, 0.005943775177001953, 0.0062923431396484375, 0.006640911102294922, 0.006989479064941406, 0.007338047027587891, 0.007686614990234375, 0.00803518295288086, 0.008383750915527344, 0.008732318878173828, 0.009080886840820312, 0.009429454803466797, 0.009778022766113281, 0.010126590728759766, 0.01047515869140625]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 5.0, 7.0, 12.0, 12.0, 12.0, 17.0, 39.0, 31.0, 38.0, 62.0, 83.0, 90.0, 109.0, 97.0, 70.0, 61.0, 46.0, 42.0, 24.0, 26.0, 28.0, 12.0, 11.0, 14.0, 10.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09459031373262405, -0.09187114983797073, -0.08915199339389801, -0.08643282949924469, -0.08371366560459137, -0.08099450170993805, -0.07827533781528473, -0.075556181371212, -0.07283701747655869, -0.07011785358190536, -0.06739869713783264, -0.06467953324317932, -0.061960369348526, -0.05924120545387268, -0.05652204528450966, -0.05380288511514664, -0.05108372122049332, -0.048364557325839996, -0.045645397156476974, -0.04292623698711395, -0.04020707309246063, -0.03748790919780731, -0.03476874902844429, -0.03204958885908127, -0.029330424964427948, -0.026611262932419777, -0.023892100900411606, -0.021172938868403435, -0.018453776836395264, -0.015734614804387093, -0.013015452772378922, -0.01029629074037075, -0.007577121257781982, -0.004857959225773811, -0.0021387971937656403, 0.0005803648382425308, 0.003299526870250702, 0.006018688902258873, 0.008737850934267044, 0.011457012966275215, 0.014176174998283386, 0.016895337030291557, 0.01961449906229973, 0.0223336610943079, 0.02505282312631607, 0.02777198515832424, 0.030491147190332413, 0.033210307359695435, 0.035929471254348755, 0.038648635149002075, 0.0413677953183651, 0.04408695548772812, 0.04680611938238144, 0.04952528327703476, 0.05224444344639778, 0.0549636036157608, 0.057682767510414124, 0.060401931405067444, 0.06312109529972076, 0.06584025174379349, 0.06855941563844681, 0.07127857953310013, 0.07399773597717285, 0.07671689987182617, 0.07943606376647949]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 11.0, 7.0, 17.0, 11.0, 15.0, 14.0, 16.0, 15.0, 31.0, 23.0, 20.0, 27.0, 33.0, 29.0, 42.0, 45.0, 45.0, 31.0, 45.0, 32.0, 45.0, 54.0, 40.0, 37.0, 41.0, 38.0, 28.0, 29.0, 36.0, 18.0, 25.0, 14.0, 11.0, 17.0, 11.0, 7.0, 7.0, 7.0, 7.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05530207231640816, -0.0533895343542099, -0.05147700011730194, -0.04956446588039398, -0.047651927918195724, -0.04573938995599747, -0.04382685571908951, -0.04191432148218155, -0.04000178351998329, -0.038089245557785034, -0.036176711320877075, -0.034264177083969116, -0.03235163912177086, -0.03043910302221775, -0.028526566922664642, -0.026614030823111534, -0.024701494723558426, -0.022788958624005318, -0.02087642252445221, -0.0189638864248991, -0.017051350325345993, -0.015138814225792885, -0.013226278126239777, -0.011313742026686668, -0.00940120592713356, -0.007488669827580452, -0.005576133728027344, -0.0036635976284742355, -0.0017510615289211273, 0.0001614745706319809, 0.002074010670185089, 0.003986546769738197, 0.005899086594581604, 0.007811622694134712, 0.00972415879368782, 0.011636694893240929, 0.013549230992794037, 0.015461767092347145, 0.017374303191900253, 0.01928683929145336, 0.02119937539100647, 0.023111911490559578, 0.025024447590112686, 0.026936983689665794, 0.028849519789218903, 0.03076205588877201, 0.03267459198832512, 0.034587129950523376, 0.036499664187431335, 0.038412198424339294, 0.04032473638653755, 0.04223727434873581, 0.04414980858564377, 0.04606234282255173, 0.047974880784749985, 0.04988741874694824, 0.0517999529838562, 0.05371248722076416, 0.05562502518296242, 0.057537563145160675, 0.059450097382068634, 0.06136263161897659, 0.06327517330646515, 0.06518770754337311, 0.06710024178028107]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 9.0, 11.0, 20.0, 18.0, 21.0, 42.0, 63.0, 91.0, 91.0, 143.0, 220.0, 315.0, 427.0, 625.0, 859.0, 1218.0, 1898.0, 2736.0, 4015.0, 5874.0, 9255.0, 14279.0, 22680.0, 38605.0, 67367.0, 129687.0, 300059.0, 1102357.0, 1637441.0, 460883.0, 175521.0, 88781.0, 49166.0, 29173.0, 17669.0, 11196.0, 7191.0, 4732.0, 3072.0, 2093.0, 1380.0, 964.0, 656.0, 440.0, 286.0, 221.0, 152.0, 107.0, 71.0, 32.0, 31.0, 21.0, 12.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.08343505859375, -0.08092117309570312, -0.07840728759765625, -0.07589340209960938, -0.0733795166015625, -0.07086563110351562, -0.06835174560546875, -0.06583786010742188, -0.063323974609375, -0.060810089111328125, -0.05829620361328125, -0.055782318115234375, -0.0532684326171875, -0.050754547119140625, -0.04824066162109375, -0.045726776123046875, -0.043212890625, -0.040699005126953125, -0.03818511962890625, -0.035671234130859375, -0.0331573486328125, -0.030643463134765625, -0.02812957763671875, -0.025615692138671875, -0.023101806640625, -0.020587921142578125, -0.01807403564453125, -0.015560150146484375, -0.0130462646484375, -0.010532379150390625, -0.00801849365234375, -0.005504608154296875, -0.00299072265625, -0.000476837158203125, 0.00203704833984375, 0.004550933837890625, 0.0070648193359375, 0.009578704833984375, 0.01209259033203125, 0.014606475830078125, 0.017120361328125, 0.019634246826171875, 0.02214813232421875, 0.024662017822265625, 0.0271759033203125, 0.029689788818359375, 0.03220367431640625, 0.034717559814453125, 0.0372314453125, 0.039745330810546875, 0.04225921630859375, 0.044773101806640625, 0.0472869873046875, 0.049800872802734375, 0.05231475830078125, 0.054828643798828125, 0.057342529296875, 0.059856414794921875, 0.06237030029296875, 0.06488418579101562, 0.0673980712890625, 0.06991195678710938, 0.07242584228515625, 0.07493972778320312, 0.07745361328125]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 10.0, 18.0, 19.0, 9.0, 12.0, 15.0, 23.0, 25.0, 25.0, 23.0, 35.0, 41.0, 45.0, 43.0, 43.0, 37.0, 40.0, 53.0, 50.0, 44.0, 42.0, 49.0, 33.0, 32.0, 36.0, 25.0, 23.0, 29.0, 19.0, 16.0, 19.0, 10.0, 8.0, 5.0, 6.0, 6.0, 8.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.035369873046875, -0.034188270568847656, -0.03300666809082031, -0.03182506561279297, -0.030643463134765625, -0.02946186065673828, -0.028280258178710938, -0.027098655700683594, -0.02591705322265625, -0.024735450744628906, -0.023553848266601562, -0.02237224578857422, -0.021190643310546875, -0.02000904083251953, -0.018827438354492188, -0.017645835876464844, -0.0164642333984375, -0.015282630920410156, -0.014101028442382812, -0.012919425964355469, -0.011737823486328125, -0.010556221008300781, -0.009374618530273438, -0.008193016052246094, -0.00701141357421875, -0.005829811096191406, -0.0046482086181640625, -0.0034666061401367188, -0.002285003662109375, -0.0011034011840820312, 7.82012939453125e-05, 0.0012598037719726562, 0.00244140625, 0.0036230087280273438, 0.0048046112060546875, 0.005986213684082031, 0.007167816162109375, 0.008349418640136719, 0.009531021118164062, 0.010712623596191406, 0.01189422607421875, 0.013075828552246094, 0.014257431030273438, 0.015439033508300781, 0.016620635986328125, 0.01780223846435547, 0.018983840942382812, 0.020165443420410156, 0.0213470458984375, 0.022528648376464844, 0.023710250854492188, 0.02489185333251953, 0.026073455810546875, 0.02725505828857422, 0.028436660766601562, 0.029618263244628906, 0.03079986572265625, 0.031981468200683594, 0.03316307067871094, 0.03434467315673828, 0.035526275634765625, 0.03670787811279297, 0.03788948059082031, 0.039071083068847656, 0.040252685546875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 5.0, 10.0, 15.0, 23.0, 31.0, 48.0, 68.0, 87.0, 112.0, 209.0, 288.0, 398.0, 556.0, 848.0, 1242.0, 1974.0, 2880.0, 4532.0, 7123.0, 10881.0, 17900.0, 29683.0, 50401.0, 89665.0, 170527.0, 358767.0, 943522.0, 1468602.0, 524591.0, 230840.0, 117023.0, 63872.0, 37233.0, 22215.0, 13534.0, 8720.0, 5413.0, 3490.0, 2277.0, 1486.0, 1021.0, 666.0, 467.0, 311.0, 220.0, 163.0, 108.0, 72.0, 44.0, 40.0, 40.0, 11.0, 17.0, 7.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0], "bins": [-0.060150146484375, -0.05822324752807617, -0.056296348571777344, -0.054369449615478516, -0.05244255065917969, -0.05051565170288086, -0.04858875274658203, -0.0466618537902832, -0.044734954833984375, -0.04280805587768555, -0.04088115692138672, -0.03895425796508789, -0.03702735900878906, -0.035100460052490234, -0.033173561096191406, -0.031246662139892578, -0.02931976318359375, -0.027392864227294922, -0.025465965270996094, -0.023539066314697266, -0.021612167358398438, -0.01968526840209961, -0.01775836944580078, -0.015831470489501953, -0.013904571533203125, -0.011977672576904297, -0.010050773620605469, -0.00812387466430664, -0.0061969757080078125, -0.004270076751708984, -0.0023431777954101562, -0.0004162788391113281, 0.0015106201171875, 0.003437519073486328, 0.005364418029785156, 0.007291316986083984, 0.009218215942382812, 0.01114511489868164, 0.013072013854980469, 0.014998912811279297, 0.016925811767578125, 0.018852710723876953, 0.02077960968017578, 0.02270650863647461, 0.024633407592773438, 0.026560306549072266, 0.028487205505371094, 0.030414104461669922, 0.03234100341796875, 0.03426790237426758, 0.036194801330566406, 0.038121700286865234, 0.04004859924316406, 0.04197549819946289, 0.04390239715576172, 0.04582929611206055, 0.047756195068359375, 0.0496830940246582, 0.05160999298095703, 0.05353689193725586, 0.05546379089355469, 0.057390689849853516, 0.059317588806152344, 0.06124448776245117, 0.06317138671875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 11.0, 18.0, 21.0, 31.0, 24.0, 57.0, 37.0, 60.0, 61.0, 96.0, 126.0, 134.0, 137.0, 214.0, 210.0, 242.0, 279.0, 323.0, 321.0, 289.0, 246.0, 196.0, 159.0, 135.0, 103.0, 105.0, 77.0, 63.0, 59.0, 55.0, 37.0, 43.0, 23.0, 12.0, 14.0, 12.0, 4.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0199127197265625, -0.019286632537841797, -0.018660545349121094, -0.01803445816040039, -0.017408370971679688, -0.016782283782958984, -0.01615619659423828, -0.015530109405517578, -0.014904022216796875, -0.014277935028076172, -0.013651847839355469, -0.013025760650634766, -0.012399673461914062, -0.01177358627319336, -0.011147499084472656, -0.010521411895751953, -0.00989532470703125, -0.009269237518310547, -0.008643150329589844, -0.00801706314086914, -0.0073909759521484375, -0.006764888763427734, -0.006138801574707031, -0.005512714385986328, -0.004886627197265625, -0.004260540008544922, -0.0036344528198242188, -0.0030083656311035156, -0.0023822784423828125, -0.0017561912536621094, -0.0011301040649414062, -0.0005040168762207031, 0.0001220703125, 0.0007481575012207031, 0.0013742446899414062, 0.0020003318786621094, 0.0026264190673828125, 0.0032525062561035156, 0.0038785934448242188, 0.004504680633544922, 0.005130767822265625, 0.005756855010986328, 0.006382942199707031, 0.007009029388427734, 0.0076351165771484375, 0.00826120376586914, 0.008887290954589844, 0.009513378143310547, 0.01013946533203125, 0.010765552520751953, 0.011391639709472656, 0.01201772689819336, 0.012643814086914062, 0.013269901275634766, 0.013895988464355469, 0.014522075653076172, 0.015148162841796875, 0.015774250030517578, 0.01640033721923828, 0.017026424407958984, 0.017652511596679688, 0.01827859878540039, 0.018904685974121094, 0.019530773162841797, 0.0201568603515625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 6.0, 11.0, 5.0, 15.0, 12.0, 18.0, 23.0, 27.0, 36.0, 55.0, 65.0, 70.0, 98.0, 81.0, 84.0, 80.0, 48.0, 49.0, 40.0, 30.0, 22.0, 21.0, 19.0, 21.0, 7.0, 12.0, 5.0, 9.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0495084673166275, -0.047843873500823975, -0.04617927968502045, -0.04451468586921692, -0.04285008832812309, -0.041185494512319565, -0.03952090069651604, -0.03785630688071251, -0.03619170933961868, -0.034527115523815155, -0.03286252170801163, -0.03119792602956295, -0.029533330351114273, -0.027868736535310745, -0.026204142719507217, -0.02453954890370369, -0.022874955087900162, -0.021210361272096634, -0.019545765593647957, -0.01788117177784443, -0.016216576099395752, -0.014551982283592224, -0.012887388467788696, -0.011222793720662594, -0.009558198973536491, -0.007893604226410389, -0.006229009944945574, -0.004564415663480759, -0.0028998209163546562, -0.0012352261692285538, 0.00042936764657497406, 0.0020939623937010765, 0.0037585608661174774, 0.00542315561324358, 0.007087749894708395, 0.00875234417617321, 0.010416938923299313, 0.012081533670425415, 0.013746127486228943, 0.015410722233355045, 0.017075316980481148, 0.018739910796284676, 0.020404506474733353, 0.02206910029053688, 0.02373369410634041, 0.025398289784789085, 0.027062883600592613, 0.02872747927904129, 0.030392073094844818, 0.032056666910648346, 0.033721260726451874, 0.0353858545422554, 0.03705045208334923, 0.038715045899152756, 0.040379639714956284, 0.04204423353075981, 0.04370883107185364, 0.045373424887657166, 0.04703801870346069, 0.04870261251926422, 0.05036721006035805, 0.052031803876161575, 0.0536963976919651, 0.05536099150776863, 0.05702558532357216]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 3.0, 6.0, 12.0, 17.0, 9.0, 21.0, 26.0, 17.0, 22.0, 19.0, 20.0, 32.0, 32.0, 40.0, 33.0, 40.0, 46.0, 53.0, 41.0, 42.0, 33.0, 50.0, 32.0, 37.0, 50.0, 35.0, 40.0, 30.0, 30.0, 24.0, 14.0, 7.0, 18.0, 15.0, 10.0, 9.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.044363878667354584, -0.04304345324635506, -0.04172302782535553, -0.040402598679065704, -0.03908217325806618, -0.03776174783706665, -0.036441318690776825, -0.0351208932697773, -0.03380046784877777, -0.032480042427778244, -0.031159615144133568, -0.02983918786048889, -0.028518762439489365, -0.027198337018489838, -0.02587790973484516, -0.024557482451200485, -0.023237057030200958, -0.02191663160920143, -0.020596204325556755, -0.01927577704191208, -0.017955351620912552, -0.016634926199913025, -0.015314498916268349, -0.013994072563946247, -0.012673646211624146, -0.011353219859302044, -0.010032793506979942, -0.00871236715465784, -0.007391940802335739, -0.0060715144500136375, -0.004751088097691536, -0.0034306617453694344, -0.0021102316677570343, -0.0007898053154349327, 0.0005306210368871689, 0.0018510473892092705, 0.003171473741531372, 0.004491900093853474, 0.005812326446175575, 0.007132752798497677, 0.008453179150819778, 0.00977360550314188, 0.011094031855463982, 0.012414458207786083, 0.013734884560108185, 0.015055310912430286, 0.016375737264752388, 0.017696164548397064, 0.01901658996939659, 0.020337015390396118, 0.021657442674040794, 0.02297786995768547, 0.024298295378684998, 0.025618720799684525, 0.0269391480833292, 0.028259575366973877, 0.029580000787973404, 0.03090042620897293, 0.032220855355262756, 0.03354128077626228, 0.03486170619726181, 0.03618213161826134, 0.037502557039260864, 0.03882298618555069, 0.04014341160655022]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 15.0, 15.0, 16.0, 26.0, 29.0, 47.0, 65.0, 100.0, 133.0, 196.0, 285.0, 406.0, 597.0, 799.0, 1119.0, 1677.0, 2252.0, 3342.0, 4774.0, 7139.0, 10605.0, 16152.0, 24878.0, 39611.0, 65853.0, 120342.0, 234829.0, 224643.0, 114764.0, 63674.0, 38082.0, 23826.0, 15519.0, 10168.0, 6955.0, 4671.0, 3324.0, 2287.0, 1575.0, 1137.0, 782.0, 552.0, 403.0, 281.0, 180.0, 142.0, 87.0, 68.0, 40.0, 38.0, 23.0, 22.0, 9.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.0200042724609375, -0.0193784236907959, -0.018752574920654297, -0.018126726150512695, -0.017500877380371094, -0.016875028610229492, -0.01624917984008789, -0.015623331069946289, -0.014997482299804688, -0.014371633529663086, -0.013745784759521484, -0.013119935989379883, -0.012494087219238281, -0.01186823844909668, -0.011242389678955078, -0.010616540908813477, -0.009990692138671875, -0.009364843368530273, -0.008738994598388672, -0.00811314582824707, -0.007487297058105469, -0.006861448287963867, -0.006235599517822266, -0.005609750747680664, -0.0049839019775390625, -0.004358053207397461, -0.0037322044372558594, -0.003106355667114258, -0.0024805068969726562, -0.0018546581268310547, -0.0012288093566894531, -0.0006029605865478516, 2.288818359375e-05, 0.0006487369537353516, 0.0012745857238769531, 0.0019004344940185547, 0.0025262832641601562, 0.003152132034301758, 0.0037779808044433594, 0.004403829574584961, 0.0050296783447265625, 0.005655527114868164, 0.006281375885009766, 0.006907224655151367, 0.007533073425292969, 0.00815892219543457, 0.008784770965576172, 0.009410619735717773, 0.010036468505859375, 0.010662317276000977, 0.011288166046142578, 0.01191401481628418, 0.012539863586425781, 0.013165712356567383, 0.013791561126708984, 0.014417409896850586, 0.015043258666992188, 0.01566910743713379, 0.01629495620727539, 0.016920804977416992, 0.017546653747558594, 0.018172502517700195, 0.018798351287841797, 0.0194242000579834, 0.020050048828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 6.0, 12.0, 7.0, 9.0, 16.0, 24.0, 19.0, 20.0, 15.0, 21.0, 28.0, 35.0, 29.0, 37.0, 30.0, 30.0, 46.0, 54.0, 38.0, 45.0, 41.0, 46.0, 39.0, 28.0, 38.0, 42.0, 31.0, 33.0, 27.0, 23.0, 19.0, 22.0, 10.0, 14.0, 14.0, 11.0, 6.0, 8.0, 4.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04388427734375, -0.04258918762207031, -0.041294097900390625, -0.03999900817871094, -0.03870391845703125, -0.03740882873535156, -0.036113739013671875, -0.03481864929199219, -0.0335235595703125, -0.03222846984863281, -0.030933380126953125, -0.029638290405273438, -0.02834320068359375, -0.027048110961914062, -0.025753021240234375, -0.024457931518554688, -0.023162841796875, -0.021867752075195312, -0.020572662353515625, -0.019277572631835938, -0.01798248291015625, -0.016687393188476562, -0.015392303466796875, -0.014097213745117188, -0.0128021240234375, -0.011507034301757812, -0.010211944580078125, -0.008916854858398438, -0.00762176513671875, -0.0063266754150390625, -0.005031585693359375, -0.0037364959716796875, -0.00244140625, -0.0011463165283203125, 0.000148773193359375, 0.0014438629150390625, 0.00273895263671875, 0.0040340423583984375, 0.005329132080078125, 0.0066242218017578125, 0.0079193115234375, 0.009214401245117188, 0.010509490966796875, 0.011804580688476562, 0.01309967041015625, 0.014394760131835938, 0.015689849853515625, 0.016984939575195312, 0.018280029296875, 0.019575119018554688, 0.020870208740234375, 0.022165298461914062, 0.02346038818359375, 0.024755477905273438, 0.026050567626953125, 0.027345657348632812, 0.0286407470703125, 0.029935836791992188, 0.031230926513671875, 0.03252601623535156, 0.03382110595703125, 0.03511619567871094, 0.036411285400390625, 0.03770637512207031, 0.03900146484375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 14.0, 22.0, 27.0, 42.0, 56.0, 84.0, 128.0, 164.0, 254.0, 461.0, 653.0, 958.0, 1491.0, 2208.0, 3685.0, 6162.0, 10954.0, 22969.0, 64948.0, 308185.0, 476639.0, 88399.0, 29074.0, 12678.0, 6846.0, 4063.0, 2565.0, 1564.0, 1090.0, 719.0, 477.0, 310.0, 214.0, 115.0, 79.0, 68.0, 63.0, 41.0, 20.0, 18.0, 12.0, 8.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04840087890625, -0.0469822883605957, -0.045563697814941406, -0.04414510726928711, -0.04272651672363281, -0.041307926177978516, -0.03988933563232422, -0.03847074508666992, -0.037052154541015625, -0.03563356399536133, -0.03421497344970703, -0.032796382904052734, -0.03137779235839844, -0.02995920181274414, -0.028540611267089844, -0.027122020721435547, -0.02570343017578125, -0.024284839630126953, -0.022866249084472656, -0.02144765853881836, -0.020029067993164062, -0.018610477447509766, -0.01719188690185547, -0.015773296356201172, -0.014354705810546875, -0.012936115264892578, -0.011517524719238281, -0.010098934173583984, -0.008680343627929688, -0.007261753082275391, -0.005843162536621094, -0.004424571990966797, -0.0030059814453125, -0.0015873908996582031, -0.00016880035400390625, 0.0012497901916503906, 0.0026683807373046875, 0.004086971282958984, 0.005505561828613281, 0.006924152374267578, 0.008342742919921875, 0.009761333465576172, 0.011179924011230469, 0.012598514556884766, 0.014017105102539062, 0.01543569564819336, 0.016854286193847656, 0.018272876739501953, 0.01969146728515625, 0.021110057830810547, 0.022528648376464844, 0.02394723892211914, 0.025365829467773438, 0.026784420013427734, 0.02820301055908203, 0.029621601104736328, 0.031040191650390625, 0.03245878219604492, 0.03387737274169922, 0.035295963287353516, 0.03671455383300781, 0.03813314437866211, 0.039551734924316406, 0.0409703254699707, 0.042388916015625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 18.0, 12.0, 14.0, 9.0, 20.0, 18.0, 18.0, 24.0, 24.0, 25.0, 21.0, 41.0, 39.0, 40.0, 32.0, 49.0, 43.0, 40.0, 36.0, 40.0, 53.0, 46.0, 31.0, 35.0, 32.0, 30.0, 27.0, 24.0, 22.0, 14.0, 23.0, 18.0, 11.0, 12.0, 13.0, 8.0, 8.0, 4.0, 6.0, 6.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0232696533203125, -0.02243971824645996, -0.021609783172607422, -0.020779848098754883, -0.019949913024902344, -0.019119977951049805, -0.018290042877197266, -0.017460107803344727, -0.016630172729492188, -0.01580023765563965, -0.01497030258178711, -0.01414036750793457, -0.013310432434082031, -0.012480497360229492, -0.011650562286376953, -0.010820627212524414, -0.009990692138671875, -0.009160757064819336, -0.008330821990966797, -0.007500886917114258, -0.006670951843261719, -0.00584101676940918, -0.005011081695556641, -0.0041811466217041016, -0.0033512115478515625, -0.0025212764739990234, -0.0016913414001464844, -0.0008614063262939453, -3.147125244140625e-05, 0.0007984638214111328, 0.0016283988952636719, 0.002458333969116211, 0.00328826904296875, 0.004118204116821289, 0.004948139190673828, 0.005778074264526367, 0.006608009338378906, 0.007437944412231445, 0.008267879486083984, 0.009097814559936523, 0.009927749633789062, 0.010757684707641602, 0.01158761978149414, 0.01241755485534668, 0.013247489929199219, 0.014077425003051758, 0.014907360076904297, 0.015737295150756836, 0.016567230224609375, 0.017397165298461914, 0.018227100372314453, 0.019057035446166992, 0.01988697052001953, 0.02071690559387207, 0.02154684066772461, 0.02237677574157715, 0.023206710815429688, 0.024036645889282227, 0.024866580963134766, 0.025696516036987305, 0.026526451110839844, 0.027356386184692383, 0.028186321258544922, 0.02901625633239746, 0.02984619140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 10.0, 16.0, 18.0, 33.0, 41.0, 47.0, 52.0, 75.0, 121.0, 125.0, 246.0, 273.0, 432.0, 497.0, 720.0, 1186.0, 1747.0, 2805.0, 5231.0, 10011.0, 23990.0, 85555.0, 720283.0, 136345.0, 30811.0, 12168.0, 6011.0, 3445.0, 2026.0, 1260.0, 809.0, 598.0, 391.0, 296.0, 221.0, 170.0, 124.0, 100.0, 53.0, 63.0, 33.0, 26.0, 32.0, 10.0, 6.0, 14.0, 9.0, 5.0, 6.0, 2.0, 0.0, 3.0], "bins": [-0.005161285400390625, -0.005012214183807373, -0.004863142967224121, -0.004714071750640869, -0.004565000534057617, -0.004415929317474365, -0.004266858100891113, -0.004117786884307861, -0.003968715667724609, -0.0038196444511413574, -0.0036705732345581055, -0.0035215020179748535, -0.0033724308013916016, -0.0032233595848083496, -0.0030742883682250977, -0.0029252171516418457, -0.0027761459350585938, -0.002627074718475342, -0.00247800350189209, -0.002328932285308838, -0.002179861068725586, -0.002030789852142334, -0.001881718635559082, -0.00173264741897583, -0.0015835762023925781, -0.0014345049858093262, -0.0012854337692260742, -0.0011363625526428223, -0.0009872913360595703, -0.0008382201194763184, -0.0006891489028930664, -0.0005400776863098145, -0.0003910064697265625, -0.00024193525314331055, -9.28640365600586e-05, 5.620718002319336e-05, 0.0002052783966064453, 0.00035434961318969727, 0.0005034208297729492, 0.0006524920463562012, 0.0008015632629394531, 0.0009506344795227051, 0.001099705696105957, 0.001248776912689209, 0.001397848129272461, 0.0015469193458557129, 0.0016959905624389648, 0.0018450617790222168, 0.0019941329956054688, 0.0021432042121887207, 0.0022922754287719727, 0.0024413466453552246, 0.0025904178619384766, 0.0027394890785217285, 0.0028885602951049805, 0.0030376315116882324, 0.0031867027282714844, 0.0033357739448547363, 0.0034848451614379883, 0.0036339163780212402, 0.003782987594604492, 0.003932058811187744, 0.004081130027770996, 0.004230201244354248, 0.0043792724609375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 14.0, 0.0, 21.0, 0.0, 25.0, 0.0, 0.0, 41.0, 0.0, 52.0, 0.0, 60.0, 0.0, 103.0, 0.0, 123.0, 0.0, 0.0, 119.0, 0.0, 115.0, 0.0, 108.0, 0.0, 72.0, 0.0, 55.0, 0.0, 0.0, 35.0, 0.0, 26.0, 0.0, 14.0, 0.0, 14.0, 0.0, 8.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.670613169670105e-07, -8.400529623031616e-07, -8.130446076393127e-07, -7.860362529754639e-07, -7.59027898311615e-07, -7.320195436477661e-07, -7.050111889839172e-07, -6.780028343200684e-07, -6.509944796562195e-07, -6.239861249923706e-07, -5.969777703285217e-07, -5.699694156646729e-07, -5.42961061000824e-07, -5.159527063369751e-07, -4.889443516731262e-07, -4.6193599700927734e-07, -4.3492764234542847e-07, -4.079192876815796e-07, -3.809109330177307e-07, -3.5390257835388184e-07, -3.2689422369003296e-07, -2.998858690261841e-07, -2.728775143623352e-07, -2.4586915969848633e-07, -2.1886080503463745e-07, -1.9185245037078857e-07, -1.648440957069397e-07, -1.3783574104309082e-07, -1.1082738637924194e-07, -8.381903171539307e-08, -5.681067705154419e-08, -2.9802322387695312e-08, -2.7939677238464355e-09, 2.421438694000244e-08, 5.122274160385132e-08, 7.82310962677002e-08, 1.0523945093154907e-07, 1.3224780559539795e-07, 1.5925616025924683e-07, 1.862645149230957e-07, 2.1327286958694458e-07, 2.4028122425079346e-07, 2.6728957891464233e-07, 2.942979335784912e-07, 3.213062882423401e-07, 3.4831464290618896e-07, 3.7532299757003784e-07, 4.023313522338867e-07, 4.293397068977356e-07, 4.5634806156158447e-07, 4.833564162254333e-07, 5.103647708892822e-07, 5.373731255531311e-07, 5.6438148021698e-07, 5.913898348808289e-07, 6.183981895446777e-07, 6.454065442085266e-07, 6.724148988723755e-07, 6.994232535362244e-07, 7.264316082000732e-07, 7.534399628639221e-07, 7.80448317527771e-07, 8.074566721916199e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 9.0, 5.0, 5.0, 13.0, 27.0, 26.0, 28.0, 52.0, 72.0, 94.0, 111.0, 170.0, 222.0, 286.0, 429.0, 553.0, 720.0, 1044.0, 1537.0, 2138.0, 3178.0, 4460.0, 6974.0, 11204.0, 19486.0, 37985.0, 90520.0, 325470.0, 353496.0, 94693.0, 39574.0, 19919.0, 11502.0, 7107.0, 4621.0, 3198.0, 2177.0, 1531.0, 1065.0, 788.0, 563.0, 377.0, 305.0, 219.0, 172.0, 130.0, 73.0, 60.0, 51.0, 39.0, 25.0, 17.0, 13.0, 11.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0], "bins": [-0.0028228759765625, -0.0027347207069396973, -0.0026465654373168945, -0.002558410167694092, -0.002470254898071289, -0.0023820996284484863, -0.0022939443588256836, -0.002205789089202881, -0.002117633819580078, -0.0020294785499572754, -0.0019413232803344727, -0.00185316801071167, -0.0017650127410888672, -0.0016768574714660645, -0.0015887022018432617, -0.001500546932220459, -0.0014123916625976562, -0.0013242363929748535, -0.0012360811233520508, -0.001147925853729248, -0.0010597705841064453, -0.0009716153144836426, -0.0008834600448608398, -0.0007953047752380371, -0.0007071495056152344, -0.0006189942359924316, -0.0005308389663696289, -0.00044268369674682617, -0.00035452842712402344, -0.0002663731575012207, -0.00017821788787841797, -9.006261825561523e-05, -1.9073486328125e-06, 8.624792098999023e-05, 0.00017440319061279297, 0.0002625584602355957, 0.00035071372985839844, 0.00043886899948120117, 0.0005270242691040039, 0.0006151795387268066, 0.0007033348083496094, 0.0007914900779724121, 0.0008796453475952148, 0.0009678006172180176, 0.0010559558868408203, 0.001144111156463623, 0.0012322664260864258, 0.0013204216957092285, 0.0014085769653320312, 0.001496732234954834, 0.0015848875045776367, 0.0016730427742004395, 0.0017611980438232422, 0.001849353313446045, 0.0019375085830688477, 0.0020256638526916504, 0.002113819122314453, 0.002201974391937256, 0.0022901296615600586, 0.0023782849311828613, 0.002466440200805664, 0.002554595470428467, 0.0026427507400512695, 0.0027309060096740723, 0.002819061279296875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 1.0, 8.0, 6.0, 11.0, 14.0, 15.0, 28.0, 55.0, 76.0, 77.0, 111.0, 143.0, 105.0, 91.0, 68.0, 60.0, 27.0, 13.0, 14.0, 16.0, 8.0, 8.0, 8.0, 3.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008721351623535156, -0.0008436143398284912, -0.0008150935173034668, -0.0007865726947784424, -0.000758051872253418, -0.0007295310497283936, -0.0007010102272033691, -0.0006724894046783447, -0.0006439685821533203, -0.0006154477596282959, -0.0005869269371032715, -0.0005584061145782471, -0.0005298852920532227, -0.0005013644695281982, -0.00047284364700317383, -0.0004443228244781494, -0.000415802001953125, -0.0003872811794281006, -0.00035876035690307617, -0.00033023953437805176, -0.00030171871185302734, -0.00027319788932800293, -0.0002446770668029785, -0.0002161562442779541, -0.0001876354217529297, -0.00015911459922790527, -0.00013059377670288086, -0.00010207295417785645, -7.355213165283203e-05, -4.503130912780762e-05, -1.6510486602783203e-05, 1.2010335922241211e-05, 4.0531158447265625e-05, 6.905198097229004e-05, 9.757280349731445e-05, 0.00012609362602233887, 0.00015461444854736328, 0.0001831352710723877, 0.0002116560935974121, 0.00024017691612243652, 0.00026869773864746094, 0.00029721856117248535, 0.00032573938369750977, 0.0003542602062225342, 0.0003827810287475586, 0.000411301851272583, 0.0004398226737976074, 0.00046834349632263184, 0.0004968643188476562, 0.0005253851413726807, 0.0005539059638977051, 0.0005824267864227295, 0.0006109476089477539, 0.0006394684314727783, 0.0006679892539978027, 0.0006965100765228271, 0.0007250308990478516, 0.000753551721572876, 0.0007820725440979004, 0.0008105933666229248, 0.0008391141891479492, 0.0008676350116729736, 0.000896155834197998, 0.0009246766567230225, 0.0009531974792480469]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 6.0, 6.0, 11.0, 9.0, 8.0, 14.0, 15.0, 25.0, 23.0, 43.0, 52.0, 63.0, 74.0, 84.0, 84.0, 106.0, 69.0, 63.0, 35.0, 36.0, 34.0, 21.0, 27.0, 20.0, 13.0, 16.0, 8.0, 8.0, 3.0, 1.0, 0.0, 5.0, 0.0, 1.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04984677955508232, -0.04817146062850952, -0.04649614170193672, -0.04482082277536392, -0.04314550384879112, -0.04147018492221832, -0.03979486599564552, -0.03811954706907272, -0.036444228142499924, -0.034768909215927124, -0.033093590289354324, -0.031418271362781525, -0.029742952436208725, -0.028067633509635925, -0.026392314583063126, -0.024716995656490326, -0.023041676729917526, -0.021366357803344727, -0.019691038876771927, -0.018015719950199127, -0.016340401023626328, -0.014665082097053528, -0.012989763170480728, -0.011314444243907928, -0.009639125317335129, -0.007963806390762329, -0.006288487464189529, -0.00461316853761673, -0.00293784961104393, -0.0012625306844711304, 0.0004127882421016693, 0.002088107168674469, 0.0037634260952472687, 0.005438745021820068, 0.007114063948392868, 0.008789382874965668, 0.010464701801538467, 0.012140020728111267, 0.013815339654684067, 0.015490658581256866, 0.017165977507829666, 0.018841296434402466, 0.020516615360975266, 0.022191934287548065, 0.023867253214120865, 0.025542572140693665, 0.027217891067266464, 0.028893209993839264, 0.030568528920412064, 0.03224384784698486, 0.03391916677355766, 0.03559448570013046, 0.03726980462670326, 0.03894512355327606, 0.04062044247984886, 0.04229576140642166, 0.04397108033299446, 0.04564639925956726, 0.04732171818614006, 0.04899703711271286, 0.05067235603928566, 0.05234767496585846, 0.05402299389243126, 0.05569831281900406, 0.05737363174557686]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 3.0, 2.0, 5.0, 5.0, 3.0, 5.0, 5.0, 12.0, 17.0, 9.0, 22.0, 23.0, 20.0, 22.0, 18.0, 21.0, 31.0, 29.0, 43.0, 33.0, 41.0, 43.0, 53.0, 39.0, 42.0, 35.0, 51.0, 33.0, 34.0, 50.0, 35.0, 45.0, 25.0, 32.0, 24.0, 16.0, 5.0, 17.0, 17.0, 10.0, 8.0, 9.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04418788105249405, -0.0428764782845974, -0.041565075516700745, -0.04025367647409439, -0.03894227370619774, -0.037630870938301086, -0.036319468170404434, -0.03500806540250778, -0.03369666635990143, -0.032385263592004776, -0.031073862686753273, -0.02976245991885662, -0.028451059013605118, -0.027139656245708466, -0.025828253477811813, -0.02451685070991516, -0.02320544794201851, -0.021894045174121857, -0.020582644268870354, -0.0192712415009737, -0.0179598405957222, -0.016648437827825546, -0.015337035059928894, -0.014025633223354816, -0.012714231386780739, -0.011402829550206661, -0.010091427713632584, -0.008780024945735931, -0.007468623109161854, -0.006157221272587776, -0.004845818504691124, -0.0035344166681170464, -0.002223018556833267, -0.000911616487428546, 0.0003997855819761753, 0.0017111878842115402, 0.003022589720785618, 0.0043339915573596954, 0.005645394325256348, 0.006956796161830425, 0.008268197998404503, 0.00957959983497858, 0.010891001671552658, 0.01220240443944931, 0.013513806276023388, 0.014825208112597466, 0.016136610880494118, 0.01744801178574562, 0.018759414553642273, 0.020070817321538925, 0.021382218226790428, 0.02269362099468708, 0.024005021899938583, 0.025316424667835236, 0.026627827435731888, 0.02793923020362854, 0.029250631108880043, 0.030562033876776695, 0.0318734347820282, 0.03318483754992485, 0.0344962403178215, 0.035807639360427856, 0.03711904585361481, 0.03843044489622116, 0.03974184766411781]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 8.0, 8.0, 12.0, 12.0, 27.0, 40.0, 41.0, 83.0, 134.0, 192.0, 274.0, 419.0, 598.0, 833.0, 1297.0, 1997.0, 3054.0, 4745.0, 7087.0, 11219.0, 17605.0, 28763.0, 48549.0, 85978.0, 170053.0, 289282.0, 166284.0, 84867.0, 47719.0, 28177.0, 17485.0, 11039.0, 6978.0, 4486.0, 3069.0, 1997.0, 1307.0, 872.0, 650.0, 414.0, 239.0, 202.0, 141.0, 91.0, 57.0, 62.0, 35.0, 25.0, 16.0, 13.0, 10.0, 2.0, 6.0, 0.0, 2.0, 2.0], "bins": [-0.081787109375, -0.0793447494506836, -0.07690238952636719, -0.07446002960205078, -0.07201766967773438, -0.06957530975341797, -0.06713294982910156, -0.06469058990478516, -0.06224822998046875, -0.059805870056152344, -0.05736351013183594, -0.05492115020751953, -0.052478790283203125, -0.05003643035888672, -0.04759407043457031, -0.045151710510253906, -0.0427093505859375, -0.040266990661621094, -0.03782463073730469, -0.03538227081298828, -0.032939910888671875, -0.03049755096435547, -0.028055191040039062, -0.025612831115722656, -0.02317047119140625, -0.020728111267089844, -0.018285751342773438, -0.01584339141845703, -0.013401031494140625, -0.010958671569824219, -0.008516311645507812, -0.006073951721191406, -0.003631591796875, -0.0011892318725585938, 0.0012531280517578125, 0.0036954879760742188, 0.006137847900390625, 0.008580207824707031, 0.011022567749023438, 0.013464927673339844, 0.01590728759765625, 0.018349647521972656, 0.020792007446289062, 0.02323436737060547, 0.025676727294921875, 0.02811908721923828, 0.030561447143554688, 0.033003807067871094, 0.0354461669921875, 0.037888526916503906, 0.04033088684082031, 0.04277324676513672, 0.045215606689453125, 0.04765796661376953, 0.05010032653808594, 0.052542686462402344, 0.05498504638671875, 0.057427406311035156, 0.05986976623535156, 0.06231212615966797, 0.06475448608398438, 0.06719684600830078, 0.06963920593261719, 0.0720815658569336, 0.07452392578125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 7.0, 1.0, 0.0, 4.0, 3.0, 5.0, 10.0, 14.0, 14.0, 15.0, 15.0, 14.0, 13.0, 20.0, 26.0, 19.0, 29.0, 26.0, 32.0, 37.0, 40.0, 36.0, 40.0, 59.0, 37.0, 44.0, 40.0, 37.0, 38.0, 45.0, 37.0, 37.0, 30.0, 24.0, 30.0, 28.0, 20.0, 9.0, 10.0, 11.0, 11.0, 6.0, 12.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.039581298828125, -0.038458824157714844, -0.03733634948730469, -0.03621387481689453, -0.035091400146484375, -0.03396892547607422, -0.03284645080566406, -0.031723976135253906, -0.03060150146484375, -0.029479026794433594, -0.028356552124023438, -0.02723407745361328, -0.026111602783203125, -0.02498912811279297, -0.023866653442382812, -0.022744178771972656, -0.0216217041015625, -0.020499229431152344, -0.019376754760742188, -0.01825428009033203, -0.017131805419921875, -0.01600933074951172, -0.014886856079101562, -0.013764381408691406, -0.01264190673828125, -0.011519432067871094, -0.010396957397460938, -0.009274482727050781, -0.008152008056640625, -0.007029533386230469, -0.0059070587158203125, -0.004784584045410156, -0.003662109375, -0.0025396347045898438, -0.0014171600341796875, -0.00029468536376953125, 0.000827789306640625, 0.0019502639770507812, 0.0030727386474609375, 0.004195213317871094, 0.00531768798828125, 0.006440162658691406, 0.0075626373291015625, 0.008685111999511719, 0.009807586669921875, 0.010930061340332031, 0.012052536010742188, 0.013175010681152344, 0.0142974853515625, 0.015419960021972656, 0.016542434692382812, 0.01766490936279297, 0.018787384033203125, 0.01990985870361328, 0.021032333374023438, 0.022154808044433594, 0.02327728271484375, 0.024399757385253906, 0.025522232055664062, 0.02664470672607422, 0.027767181396484375, 0.02888965606689453, 0.030012130737304688, 0.031134605407714844, 0.032257080078125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 20.0, 20.0, 41.0, 46.0, 73.0, 102.0, 132.0, 219.0, 313.0, 423.0, 623.0, 927.0, 1275.0, 2000.0, 2918.0, 4170.0, 6469.0, 9814.0, 15106.0, 24252.0, 39640.0, 69036.0, 129423.0, 271035.0, 215606.0, 104320.0, 57016.0, 33861.0, 20785.0, 13076.0, 8481.0, 5403.0, 3799.0, 2556.0, 1742.0, 1138.0, 818.0, 578.0, 405.0, 260.0, 203.0, 137.0, 81.0, 67.0, 41.0, 29.0, 21.0, 19.0, 5.0, 11.0, 1.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.07537841796875, -0.07308292388916016, -0.07078742980957031, -0.06849193572998047, -0.06619644165039062, -0.06390094757080078, -0.06160545349121094, -0.059309959411621094, -0.05701446533203125, -0.054718971252441406, -0.05242347717285156, -0.05012798309326172, -0.047832489013671875, -0.04553699493408203, -0.04324150085449219, -0.040946006774902344, -0.0386505126953125, -0.036355018615722656, -0.03405952453613281, -0.03176403045654297, -0.029468536376953125, -0.02717304229736328, -0.024877548217773438, -0.022582054138183594, -0.02028656005859375, -0.017991065979003906, -0.015695571899414062, -0.013400077819824219, -0.011104583740234375, -0.008809089660644531, -0.0065135955810546875, -0.004218101501464844, -0.001922607421875, 0.00037288665771484375, 0.0026683807373046875, 0.004963874816894531, 0.007259368896484375, 0.009554862976074219, 0.011850357055664062, 0.014145851135253906, 0.01644134521484375, 0.018736839294433594, 0.021032333374023438, 0.02332782745361328, 0.025623321533203125, 0.02791881561279297, 0.030214309692382812, 0.032509803771972656, 0.0348052978515625, 0.037100791931152344, 0.03939628601074219, 0.04169178009033203, 0.043987274169921875, 0.04628276824951172, 0.04857826232910156, 0.050873756408691406, 0.05316925048828125, 0.055464744567871094, 0.05776023864746094, 0.06005573272705078, 0.062351226806640625, 0.06464672088623047, 0.06694221496582031, 0.06923770904541016, 0.071533203125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 3.0, 5.0, 2.0, 7.0, 13.0, 8.0, 14.0, 15.0, 16.0, 15.0, 17.0, 24.0, 19.0, 34.0, 35.0, 32.0, 44.0, 40.0, 42.0, 35.0, 45.0, 30.0, 49.0, 41.0, 53.0, 38.0, 43.0, 38.0, 23.0, 26.0, 29.0, 28.0, 23.0, 16.0, 19.0, 17.0, 19.0, 10.0, 10.0, 6.0, 6.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0209503173828125, -0.02022719383239746, -0.019504070281982422, -0.018780946731567383, -0.018057823181152344, -0.017334699630737305, -0.016611576080322266, -0.015888452529907227, -0.015165328979492188, -0.014442205429077148, -0.01371908187866211, -0.01299595832824707, -0.012272834777832031, -0.011549711227416992, -0.010826587677001953, -0.010103464126586914, -0.009380340576171875, -0.008657217025756836, -0.007934093475341797, -0.007210969924926758, -0.006487846374511719, -0.00576472282409668, -0.005041599273681641, -0.0043184757232666016, -0.0035953521728515625, -0.0028722286224365234, -0.0021491050720214844, -0.0014259815216064453, -0.0007028579711914062, 2.0265579223632812e-05, 0.0007433891296386719, 0.001466512680053711, 0.00218963623046875, 0.002912759780883789, 0.003635883331298828, 0.004359006881713867, 0.005082130432128906, 0.005805253982543945, 0.006528377532958984, 0.0072515010833740234, 0.007974624633789062, 0.008697748184204102, 0.00942087173461914, 0.01014399528503418, 0.010867118835449219, 0.011590242385864258, 0.012313365936279297, 0.013036489486694336, 0.013759613037109375, 0.014482736587524414, 0.015205860137939453, 0.015928983688354492, 0.01665210723876953, 0.01737523078918457, 0.01809835433959961, 0.01882147789001465, 0.019544601440429688, 0.020267724990844727, 0.020990848541259766, 0.021713972091674805, 0.022437095642089844, 0.023160219192504883, 0.023883342742919922, 0.02460646629333496, 0.02532958984375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 8.0, 14.0, 17.0, 24.0, 34.0, 48.0, 70.0, 96.0, 133.0, 171.0, 226.0, 356.0, 501.0, 738.0, 1009.0, 1457.0, 2094.0, 3104.0, 4681.0, 7807.0, 13058.0, 25410.0, 78028.0, 769481.0, 78420.0, 25589.0, 13133.0, 7865.0, 4904.0, 3087.0, 2094.0, 1455.0, 1028.0, 679.0, 508.0, 314.0, 252.0, 192.0, 130.0, 84.0, 71.0, 42.0, 35.0, 32.0, 22.0, 11.0, 9.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0105743408203125, -0.010227680206298828, -0.009881019592285156, -0.009534358978271484, -0.009187698364257812, -0.00884103775024414, -0.008494377136230469, -0.008147716522216797, -0.007801055908203125, -0.007454395294189453, -0.007107734680175781, -0.006761074066162109, -0.0064144134521484375, -0.006067752838134766, -0.005721092224121094, -0.005374431610107422, -0.00502777099609375, -0.004681110382080078, -0.004334449768066406, -0.003987789154052734, -0.0036411285400390625, -0.0032944679260253906, -0.0029478073120117188, -0.002601146697998047, -0.002254486083984375, -0.0019078254699707031, -0.0015611648559570312, -0.0012145042419433594, -0.0008678436279296875, -0.0005211830139160156, -0.00017452239990234375, 0.00017213821411132812, 0.000518798828125, 0.0008654594421386719, 0.0012121200561523438, 0.0015587806701660156, 0.0019054412841796875, 0.0022521018981933594, 0.0025987625122070312, 0.002945423126220703, 0.003292083740234375, 0.003638744354248047, 0.003985404968261719, 0.004332065582275391, 0.0046787261962890625, 0.005025386810302734, 0.005372047424316406, 0.005718708038330078, 0.00606536865234375, 0.006412029266357422, 0.006758689880371094, 0.007105350494384766, 0.0074520111083984375, 0.007798671722412109, 0.008145332336425781, 0.008491992950439453, 0.008838653564453125, 0.009185314178466797, 0.009531974792480469, 0.00987863540649414, 0.010225296020507812, 0.010571956634521484, 0.010918617248535156, 0.011265277862548828, 0.0116119384765625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 12.0, 0.0, 0.0, 15.0, 0.0, 26.0, 0.0, 0.0, 43.0, 0.0, 79.0, 0.0, 0.0, 101.0, 0.0, 147.0, 0.0, 0.0, 159.0, 0.0, 168.0, 0.0, 103.0, 0.0, 0.0, 71.0, 0.0, 37.0, 0.0, 0.0, 12.0, 0.0, 20.0, 0.0, 0.0, 7.0, 0.0, 6.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.506459951400757e-07, -7.264316082000732e-07, -7.022172212600708e-07, -6.780028343200684e-07, -6.537884473800659e-07, -6.295740604400635e-07, -6.05359673500061e-07, -5.811452865600586e-07, -5.569308996200562e-07, -5.327165126800537e-07, -5.085021257400513e-07, -4.842877388000488e-07, -4.600733518600464e-07, -4.3585896492004395e-07, -4.116445779800415e-07, -3.8743019104003906e-07, -3.632158041000366e-07, -3.390014171600342e-07, -3.1478703022003174e-07, -2.905726432800293e-07, -2.6635825634002686e-07, -2.421438694000244e-07, -2.1792948246002197e-07, -1.9371509552001953e-07, -1.695007085800171e-07, -1.4528632164001465e-07, -1.210719347000122e-07, -9.685754776000977e-08, -7.264316082000732e-08, -4.842877388000488e-08, -2.421438694000244e-08, 0.0, 2.421438694000244e-08, 4.842877388000488e-08, 7.264316082000732e-08, 9.685754776000977e-08, 1.210719347000122e-07, 1.4528632164001465e-07, 1.695007085800171e-07, 1.9371509552001953e-07, 2.1792948246002197e-07, 2.421438694000244e-07, 2.6635825634002686e-07, 2.905726432800293e-07, 3.1478703022003174e-07, 3.390014171600342e-07, 3.632158041000366e-07, 3.8743019104003906e-07, 4.116445779800415e-07, 4.3585896492004395e-07, 4.600733518600464e-07, 4.842877388000488e-07, 5.085021257400513e-07, 5.327165126800537e-07, 5.569308996200562e-07, 5.811452865600586e-07, 6.05359673500061e-07, 6.295740604400635e-07, 6.537884473800659e-07, 6.780028343200684e-07, 7.022172212600708e-07, 7.264316082000732e-07, 7.506459951400757e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 8.0, 24.0, 24.0, 29.0, 43.0, 48.0, 89.0, 102.0, 129.0, 173.0, 235.0, 326.0, 453.0, 655.0, 972.0, 1441.0, 2369.0, 3981.0, 6755.0, 13035.0, 27566.0, 103852.0, 789755.0, 51710.0, 20021.0, 10030.0, 5488.0, 3094.0, 1978.0, 1223.0, 785.0, 557.0, 407.0, 280.0, 240.0, 137.0, 136.0, 87.0, 61.0, 56.0, 44.0, 29.0, 26.0, 22.0, 15.0, 13.0, 8.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.01479339599609375, -0.0143052339553833, -0.013817071914672852, -0.013328909873962402, -0.012840747833251953, -0.012352585792541504, -0.011864423751831055, -0.011376261711120605, -0.010888099670410156, -0.010399937629699707, -0.009911775588989258, -0.009423613548278809, -0.00893545150756836, -0.00844728946685791, -0.007959127426147461, -0.007470965385437012, -0.0069828033447265625, -0.006494641304016113, -0.006006479263305664, -0.005518317222595215, -0.005030155181884766, -0.004541993141174316, -0.004053831100463867, -0.003565669059753418, -0.0030775070190429688, -0.0025893449783325195, -0.0021011829376220703, -0.001613020896911621, -0.0011248588562011719, -0.0006366968154907227, -0.00014853477478027344, 0.0003396272659301758, 0.000827789306640625, 0.0013159513473510742, 0.0018041133880615234, 0.0022922754287719727, 0.002780437469482422, 0.003268599510192871, 0.0037567615509033203, 0.0042449235916137695, 0.004733085632324219, 0.005221247673034668, 0.005709409713745117, 0.006197571754455566, 0.006685733795166016, 0.007173895835876465, 0.007662057876586914, 0.008150219917297363, 0.008638381958007812, 0.009126543998718262, 0.009614706039428711, 0.01010286808013916, 0.01059103012084961, 0.011079192161560059, 0.011567354202270508, 0.012055516242980957, 0.012543678283691406, 0.013031840324401855, 0.013520002365112305, 0.014008164405822754, 0.014496326446533203, 0.014984488487243652, 0.015472650527954102, 0.01596081256866455, 0.016448974609375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 6.0, 8.0, 12.0, 16.0, 22.0, 24.0, 43.0, 303.0, 367.0, 59.0, 19.0, 19.0, 16.0, 9.0, 17.0, 8.0, 5.0, 6.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00457763671875, -0.004425168037414551, -0.0042726993560791016, -0.004120230674743652, -0.003967761993408203, -0.003815293312072754, -0.0036628246307373047, -0.0035103559494018555, -0.0033578872680664062, -0.003205418586730957, -0.003052949905395508, -0.0029004812240600586, -0.0027480125427246094, -0.00259554386138916, -0.002443075180053711, -0.0022906064987182617, -0.0021381378173828125, -0.0019856691360473633, -0.001833200454711914, -0.0016807317733764648, -0.0015282630920410156, -0.0013757944107055664, -0.0012233257293701172, -0.001070857048034668, -0.0009183883666992188, -0.0007659196853637695, -0.0006134510040283203, -0.0004609823226928711, -0.0003085136413574219, -0.00015604496002197266, -3.5762786865234375e-06, 0.00014889240264892578, 0.000301361083984375, 0.0004538297653198242, 0.0006062984466552734, 0.0007587671279907227, 0.0009112358093261719, 0.001063704490661621, 0.0012161731719970703, 0.0013686418533325195, 0.0015211105346679688, 0.001673579216003418, 0.0018260478973388672, 0.0019785165786743164, 0.0021309852600097656, 0.002283453941345215, 0.002435922622680664, 0.0025883913040161133, 0.0027408599853515625, 0.0028933286666870117, 0.003045797348022461, 0.00319826602935791, 0.0033507347106933594, 0.0035032033920288086, 0.003655672073364258, 0.003808140754699707, 0.003960609436035156, 0.0041130781173706055, 0.004265546798706055, 0.004418015480041504, 0.004570484161376953, 0.004722952842712402, 0.0048754215240478516, 0.005027890205383301, 0.00518035888671875]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 7.0, 5.0, 2.0, 8.0, 6.0, 14.0, 12.0, 6.0, 18.0, 25.0, 36.0, 38.0, 46.0, 60.0, 68.0, 94.0, 89.0, 93.0, 66.0, 66.0, 50.0, 41.0, 25.0, 29.0, 21.0, 13.0, 10.0, 10.0, 9.0, 9.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04361720383167267, -0.04209165275096893, -0.0405661016702652, -0.03904055431485176, -0.037515003234148026, -0.03598945215344429, -0.03446390479803085, -0.03293835371732712, -0.03141280263662338, -0.029887251555919647, -0.02836170233786106, -0.026836153119802475, -0.02531060203909874, -0.023785050958395004, -0.022259501740336418, -0.020733952522277832, -0.019208401441574097, -0.01768285036087036, -0.016157301142811775, -0.014631750993430614, -0.013106200844049454, -0.011580650694668293, -0.010055100545287132, -0.008529550395905972, -0.007004000246524811, -0.00547845009714365, -0.003952899947762489, -0.0024273497983813286, -0.0009017996490001678, 0.0006237505003809929, 0.0021493006497621536, 0.0036748507991433144, 0.0052004046738147736, 0.006725954823195934, 0.008251504972577095, 0.009777055121958256, 0.011302605271339417, 0.012828155420720577, 0.014353705570101738, 0.015879254788160324, 0.01740480586886406, 0.018930356949567795, 0.02045590616762638, 0.021981455385684967, 0.023507006466388702, 0.025032557547092438, 0.026558106765151024, 0.02808365598320961, 0.029609207063913345, 0.03113475814461708, 0.03266030550003052, 0.03418585658073425, 0.03571140766143799, 0.037236958742141724, 0.03876250982284546, 0.040288057178258896, 0.04181360825896263, 0.04333915933966637, 0.0448647066950798, 0.04639025777578354, 0.047915808856487274, 0.04944135993719101, 0.050966911017894745, 0.05249245837330818, 0.05401800945401192]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 8.0, 9.0, 9.0, 11.0, 10.0, 13.0, 25.0, 23.0, 13.0, 25.0, 13.0, 25.0, 31.0, 36.0, 30.0, 31.0, 42.0, 33.0, 35.0, 35.0, 39.0, 50.0, 40.0, 42.0, 46.0, 34.0, 47.0, 24.0, 25.0, 36.0, 25.0, 21.0, 25.0, 12.0, 10.0, 6.0, 9.0, 12.0, 9.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03728503733873367, -0.03613036870956421, -0.034975700080394745, -0.03382103145122528, -0.03266636282205582, -0.03151169419288635, -0.030357027426362038, -0.029202358797192574, -0.02804769016802311, -0.026893021538853645, -0.02573835290968418, -0.024583684280514717, -0.023429017513990402, -0.022274348884820938, -0.021119680255651474, -0.01996501162648201, -0.018810342997312546, -0.01765567436814308, -0.016501005738973618, -0.015346338041126728, -0.014191669411957264, -0.0130370007827878, -0.01188233308494091, -0.010727664455771446, -0.009572995826601982, -0.008418327197432518, -0.007263659033924341, -0.006108990870416164, -0.0049543222412467, -0.003799653612077236, -0.0026449854485690594, -0.0014903172850608826, -0.00033564493060112, 0.0008190234657377005, 0.001973691862076521, 0.0031283602584153414, 0.004283028654754162, 0.005437697283923626, 0.006592365447431803, 0.0077470336109399796, 0.008901702240109444, 0.010056370869278908, 0.011211039498448372, 0.012365707196295261, 0.013520375825464725, 0.01467504445463419, 0.01582971215248108, 0.016984380781650543, 0.018139049410820007, 0.01929371803998947, 0.020448386669158936, 0.0216030552983284, 0.022757723927497864, 0.023912392556667328, 0.025067059323191643, 0.026221727952361107, 0.02737639658153057, 0.028531065210700035, 0.0296857338398695, 0.030840402469038963, 0.03199506923556328, 0.03314973786473274, 0.034304406493902206, 0.03545907512307167, 0.036613743752241135]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 9.0, 10.0, 16.0, 24.0, 26.0, 48.0, 78.0, 131.0, 188.0, 258.0, 411.0, 637.0, 1080.0, 1670.0, 2837.0, 4962.0, 8569.0, 15736.0, 30308.0, 61055.0, 134281.0, 378624.0, 1847959.0, 1220649.0, 263202.0, 108424.0, 51590.0, 26691.0, 14482.0, 8092.0, 4675.0, 2785.0, 1724.0, 1090.0, 664.0, 456.0, 302.0, 210.0, 112.0, 86.0, 53.0, 21.0, 20.0, 15.0, 10.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06500244140625, -0.06296253204345703, -0.06092262268066406, -0.058882713317871094, -0.056842803955078125, -0.054802894592285156, -0.05276298522949219, -0.05072307586669922, -0.04868316650390625, -0.04664325714111328, -0.04460334777832031, -0.042563438415527344, -0.040523529052734375, -0.038483619689941406, -0.03644371032714844, -0.03440380096435547, -0.0323638916015625, -0.03032398223876953, -0.028284072875976562, -0.026244163513183594, -0.024204254150390625, -0.022164344787597656, -0.020124435424804688, -0.01808452606201172, -0.01604461669921875, -0.014004707336425781, -0.011964797973632812, -0.009924888610839844, -0.007884979248046875, -0.005845069885253906, -0.0038051605224609375, -0.0017652511596679688, 0.000274658203125, 0.0023145675659179688, 0.0043544769287109375, 0.006394386291503906, 0.008434295654296875, 0.010474205017089844, 0.012514114379882812, 0.014554023742675781, 0.01659393310546875, 0.01863384246826172, 0.020673751831054688, 0.022713661193847656, 0.024753570556640625, 0.026793479919433594, 0.028833389282226562, 0.03087329864501953, 0.0329132080078125, 0.03495311737060547, 0.03699302673339844, 0.039032936096191406, 0.041072845458984375, 0.043112754821777344, 0.04515266418457031, 0.04719257354736328, 0.04923248291015625, 0.05127239227294922, 0.05331230163574219, 0.055352210998535156, 0.057392120361328125, 0.059432029724121094, 0.06147193908691406, 0.06351184844970703, 0.0655517578125]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 10.0, 8.0, 9.0, 9.0, 9.0, 15.0, 25.0, 12.0, 15.0, 23.0, 23.0, 20.0, 33.0, 36.0, 28.0, 31.0, 37.0, 32.0, 33.0, 47.0, 44.0, 56.0, 43.0, 45.0, 32.0, 40.0, 37.0, 29.0, 35.0, 29.0, 24.0, 18.0, 22.0, 13.0, 14.0, 8.0, 8.0, 4.0, 6.0, 8.0, 3.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0234375, -0.02275228500366211, -0.02206707000732422, -0.021381855010986328, -0.020696640014648438, -0.020011425018310547, -0.019326210021972656, -0.018640995025634766, -0.017955780029296875, -0.017270565032958984, -0.016585350036621094, -0.015900135040283203, -0.015214920043945312, -0.014529705047607422, -0.013844490051269531, -0.01315927505493164, -0.01247406005859375, -0.01178884506225586, -0.011103630065917969, -0.010418415069580078, -0.009733200073242188, -0.009047985076904297, -0.008362770080566406, -0.007677555084228516, -0.006992340087890625, -0.006307125091552734, -0.005621910095214844, -0.004936695098876953, -0.0042514801025390625, -0.003566265106201172, -0.0028810501098632812, -0.0021958351135253906, -0.0015106201171875, -0.0008254051208496094, -0.00014019012451171875, 0.0005450248718261719, 0.0012302398681640625, 0.0019154548645019531, 0.0026006698608398438, 0.0032858848571777344, 0.003971099853515625, 0.004656314849853516, 0.005341529846191406, 0.006026744842529297, 0.0067119598388671875, 0.007397174835205078, 0.008082389831542969, 0.00876760482788086, 0.00945281982421875, 0.01013803482055664, 0.010823249816894531, 0.011508464813232422, 0.012193679809570312, 0.012878894805908203, 0.013564109802246094, 0.014249324798583984, 0.014934539794921875, 0.015619754791259766, 0.016304969787597656, 0.016990184783935547, 0.017675399780273438, 0.018360614776611328, 0.01904582977294922, 0.01973104476928711, 0.020416259765625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 6.0, 4.0, 3.0, 5.0, 16.0, 11.0, 16.0, 30.0, 37.0, 47.0, 69.0, 89.0, 137.0, 188.0, 297.0, 461.0, 637.0, 950.0, 1502.0, 2263.0, 3716.0, 5903.0, 9763.0, 16382.0, 27745.0, 49428.0, 91407.0, 178445.0, 383694.0, 1026722.0, 1411643.0, 503672.0, 224366.0, 112723.0, 59723.0, 33113.0, 18997.0, 11143.0, 6810.0, 4166.0, 2655.0, 1784.0, 1166.0, 748.0, 483.0, 353.0, 241.0, 180.0, 112.0, 87.0, 50.0, 34.0, 27.0, 16.0, 13.0, 8.0, 8.0, 1.0, 2.0, 1.0], "bins": [-0.04278564453125, -0.04153299331665039, -0.04028034210205078, -0.03902769088745117, -0.03777503967285156, -0.03652238845825195, -0.035269737243652344, -0.034017086029052734, -0.032764434814453125, -0.031511783599853516, -0.030259132385253906, -0.029006481170654297, -0.027753829956054688, -0.026501178741455078, -0.02524852752685547, -0.02399587631225586, -0.02274322509765625, -0.02149057388305664, -0.02023792266845703, -0.018985271453857422, -0.017732620239257812, -0.016479969024658203, -0.015227317810058594, -0.013974666595458984, -0.012722015380859375, -0.011469364166259766, -0.010216712951660156, -0.008964061737060547, -0.0077114105224609375, -0.006458759307861328, -0.005206108093261719, -0.003953456878662109, -0.0027008056640625, -0.0014481544494628906, -0.00019550323486328125, 0.0010571479797363281, 0.0023097991943359375, 0.003562450408935547, 0.004815101623535156, 0.006067752838134766, 0.007320404052734375, 0.008573055267333984, 0.009825706481933594, 0.011078357696533203, 0.012331008911132812, 0.013583660125732422, 0.014836311340332031, 0.01608896255493164, 0.01734161376953125, 0.01859426498413086, 0.01984691619873047, 0.021099567413330078, 0.022352218627929688, 0.023604869842529297, 0.024857521057128906, 0.026110172271728516, 0.027362823486328125, 0.028615474700927734, 0.029868125915527344, 0.031120777130126953, 0.03237342834472656, 0.03362607955932617, 0.03487873077392578, 0.03613138198852539, 0.037384033203125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 9.0, 3.0, 6.0, 8.0, 9.0, 10.0, 22.0, 10.0, 24.0, 20.0, 23.0, 38.0, 44.0, 66.0, 81.0, 96.0, 94.0, 112.0, 132.0, 139.0, 195.0, 237.0, 242.0, 298.0, 279.0, 251.0, 257.0, 212.0, 198.0, 177.0, 137.0, 130.0, 131.0, 73.0, 59.0, 57.0, 39.0, 38.0, 22.0, 20.0, 16.0, 13.0, 10.0, 10.0, 9.0, 7.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01045989990234375, -0.010093212127685547, -0.009726524353027344, -0.00935983657836914, -0.008993148803710938, -0.008626461029052734, -0.008259773254394531, -0.007893085479736328, -0.007526397705078125, -0.007159709930419922, -0.006793022155761719, -0.006426334381103516, -0.0060596466064453125, -0.005692958831787109, -0.005326271057128906, -0.004959583282470703, -0.0045928955078125, -0.004226207733154297, -0.0038595199584960938, -0.0034928321838378906, -0.0031261444091796875, -0.0027594566345214844, -0.0023927688598632812, -0.002026081085205078, -0.001659393310546875, -0.0012927055358886719, -0.0009260177612304688, -0.0005593299865722656, -0.0001926422119140625, 0.00017404556274414062, 0.0005407333374023438, 0.0009074211120605469, 0.00127410888671875, 0.0016407966613769531, 0.0020074844360351562, 0.0023741722106933594, 0.0027408599853515625, 0.0031075477600097656, 0.0034742355346679688, 0.003840923309326172, 0.004207611083984375, 0.004574298858642578, 0.004940986633300781, 0.005307674407958984, 0.0056743621826171875, 0.006041049957275391, 0.006407737731933594, 0.006774425506591797, 0.00714111328125, 0.007507801055908203, 0.007874488830566406, 0.00824117660522461, 0.008607864379882812, 0.008974552154541016, 0.009341239929199219, 0.009707927703857422, 0.010074615478515625, 0.010441303253173828, 0.010807991027832031, 0.011174678802490234, 0.011541366577148438, 0.01190805435180664, 0.012274742126464844, 0.012641429901123047, 0.01300811767578125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 5.0, 5.0, 9.0, 14.0, 9.0, 20.0, 28.0, 27.0, 28.0, 33.0, 51.0, 45.0, 73.0, 70.0, 92.0, 77.0, 64.0, 75.0, 46.0, 39.0, 48.0, 20.0, 25.0, 16.0, 16.0, 8.0, 12.0, 10.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.033902913331985474, -0.03293386101722717, -0.03196480870246887, -0.03099575638771057, -0.03002670593559742, -0.02905765362083912, -0.028088601306080818, -0.027119548991322517, -0.026150496676564217, -0.025181444361805916, -0.024212392047047615, -0.023243341594934464, -0.022274289280176163, -0.021305236965417862, -0.02033618465065956, -0.01936713233590126, -0.01839808002114296, -0.01742902770638466, -0.016459975391626358, -0.015490924008190632, -0.014521871693432331, -0.013552820309996605, -0.012583767995238304, -0.011614715680480003, -0.010645665228366852, -0.009676612913608551, -0.008707561530172825, -0.007738509215414524, -0.006769456900656223, -0.00580040505155921, -0.004831353202462196, -0.0038623008877038956, -0.002893248572945595, -0.0019241964910179377, -0.0009551445255056024, 1.390744000673294e-05, 0.00098295952193439, 0.0019520116038620472, 0.0029210634529590607, 0.0038901157677173615, 0.004859167616814375, 0.005828219465911388, 0.006797271780669689, 0.007766323629766703, 0.008735375478863716, 0.009704427793622017, 0.010673480108380318, 0.011642532423138618, 0.012611583806574345, 0.013580636121332645, 0.014549687504768372, 0.015518739819526672, 0.016487792134284973, 0.017456844449043274, 0.018425896763801575, 0.019394949078559875, 0.020363999530673027, 0.021333051845431328, 0.02230210416018963, 0.02327115461230278, 0.02424020692706108, 0.02520925924181938, 0.026178311556577682, 0.027147363871335983, 0.028116416186094284]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 5.0, 11.0, 7.0, 10.0, 5.0, 23.0, 17.0, 17.0, 25.0, 22.0, 24.0, 26.0, 39.0, 33.0, 34.0, 32.0, 44.0, 47.0, 39.0, 43.0, 41.0, 31.0, 40.0, 33.0, 30.0, 44.0, 32.0, 31.0, 36.0, 25.0, 23.0, 21.0, 15.0, 17.0, 6.0, 8.0, 14.0, 9.0, 8.0, 8.0, 10.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.027537813410162926, -0.0267912819981575, -0.026044750586152077, -0.025298219174146652, -0.024551689624786377, -0.023805158212780952, -0.023058626800775528, -0.022312095388770103, -0.02156556397676468, -0.020819032564759254, -0.02007250115275383, -0.019325971603393555, -0.01857944019138813, -0.017832908779382706, -0.01708637736737728, -0.016339845955371857, -0.015593316406011581, -0.014846784994006157, -0.014100254513323307, -0.013353723101317883, -0.012607192620635033, -0.011860661208629608, -0.011114129796624184, -0.01036759838461876, -0.00962106790393591, -0.008874536491930485, -0.008128006011247635, -0.00738147459924221, -0.006634943652898073, -0.005888412706553936, -0.0051418812945485115, -0.004395350348204374, -0.0036488212645053864, -0.002902290318161249, -0.0021557591389864683, -0.0014092279598116875, -0.0006626970134675503, 8.383393287658691e-05, 0.0008303653448820114, 0.0015768962912261486, 0.002323427237570286, 0.003069958183914423, 0.003816489363089204, 0.004563020542263985, 0.005309551488608122, 0.006056082434952259, 0.0068026138469576836, 0.007549144793301821, 0.008295675739645958, 0.009042207151651382, 0.009788737632334232, 0.010535269044339657, 0.011281799525022507, 0.012028330937027931, 0.012774862349033356, 0.01352139376103878, 0.01426792424172163, 0.015014455653727055, 0.015760986134409904, 0.01650751754641533, 0.017254048958420753, 0.018000580370426178, 0.018747109919786453, 0.019493641331791878, 0.020240172743797302]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 12.0, 15.0, 20.0, 33.0, 28.0, 57.0, 89.0, 98.0, 160.0, 278.0, 397.0, 576.0, 843.0, 1368.0, 1974.0, 2846.0, 4480.0, 7167.0, 10981.0, 17827.0, 30243.0, 54202.0, 106894.0, 240136.0, 285016.0, 129428.0, 62964.0, 34728.0, 20748.0, 12424.0, 7902.0, 4986.0, 3215.0, 2072.0, 1421.0, 910.0, 602.0, 445.0, 301.0, 217.0, 137.0, 91.0, 70.0, 57.0, 33.0, 24.0, 14.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01485443115234375, -0.01439201831817627, -0.013929605484008789, -0.013467192649841309, -0.013004779815673828, -0.012542366981506348, -0.012079954147338867, -0.011617541313171387, -0.011155128479003906, -0.010692715644836426, -0.010230302810668945, -0.009767889976501465, -0.009305477142333984, -0.008843064308166504, -0.008380651473999023, -0.007918238639831543, -0.0074558258056640625, -0.006993412971496582, -0.0065310001373291016, -0.006068587303161621, -0.005606174468994141, -0.00514376163482666, -0.00468134880065918, -0.004218935966491699, -0.0037565231323242188, -0.0032941102981567383, -0.002831697463989258, -0.0023692846298217773, -0.0019068717956542969, -0.0014444589614868164, -0.000982046127319336, -0.0005196332931518555, -5.7220458984375e-05, 0.00040519237518310547, 0.0008676052093505859, 0.0013300180435180664, 0.0017924308776855469, 0.0022548437118530273, 0.002717256546020508, 0.0031796693801879883, 0.0036420822143554688, 0.004104495048522949, 0.00456690788269043, 0.00502932071685791, 0.005491733551025391, 0.005954146385192871, 0.0064165592193603516, 0.006878972053527832, 0.0073413848876953125, 0.007803797721862793, 0.008266210556030273, 0.008728623390197754, 0.009191036224365234, 0.009653449058532715, 0.010115861892700195, 0.010578274726867676, 0.011040687561035156, 0.011503100395202637, 0.011965513229370117, 0.012427926063537598, 0.012890338897705078, 0.013352751731872559, 0.013815164566040039, 0.01427757740020752, 0.014739990234375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 9.0, 9.0, 10.0, 10.0, 7.0, 9.0, 19.0, 15.0, 21.0, 22.0, 19.0, 26.0, 32.0, 33.0, 40.0, 42.0, 43.0, 47.0, 43.0, 50.0, 47.0, 35.0, 37.0, 41.0, 42.0, 44.0, 33.0, 41.0, 22.0, 28.0, 23.0, 14.0, 20.0, 10.0, 10.0, 11.0, 10.0, 7.0, 6.0, 3.0, 6.0, 1.0, 6.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0299224853515625, -0.029111385345458984, -0.02830028533935547, -0.027489185333251953, -0.026678085327148438, -0.025866985321044922, -0.025055885314941406, -0.02424478530883789, -0.023433685302734375, -0.02262258529663086, -0.021811485290527344, -0.021000385284423828, -0.020189285278320312, -0.019378185272216797, -0.01856708526611328, -0.017755985260009766, -0.01694488525390625, -0.016133785247802734, -0.015322685241699219, -0.014511585235595703, -0.013700485229492188, -0.012889385223388672, -0.012078285217285156, -0.01126718521118164, -0.010456085205078125, -0.00964498519897461, -0.008833885192871094, -0.008022785186767578, -0.0072116851806640625, -0.006400585174560547, -0.005589485168457031, -0.004778385162353516, -0.00396728515625, -0.0031561851501464844, -0.0023450851440429688, -0.0015339851379394531, -0.0007228851318359375, 8.821487426757812e-05, 0.0008993148803710938, 0.0017104148864746094, 0.002521514892578125, 0.0033326148986816406, 0.004143714904785156, 0.004954814910888672, 0.0057659149169921875, 0.006577014923095703, 0.007388114929199219, 0.008199214935302734, 0.00901031494140625, 0.009821414947509766, 0.010632514953613281, 0.011443614959716797, 0.012254714965820312, 0.013065814971923828, 0.013876914978027344, 0.01468801498413086, 0.015499114990234375, 0.01631021499633789, 0.017121315002441406, 0.017932415008544922, 0.018743515014648438, 0.019554615020751953, 0.02036571502685547, 0.021176815032958984, 0.0219879150390625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 6.0, 10.0, 5.0, 14.0, 17.0, 16.0, 37.0, 31.0, 43.0, 64.0, 81.0, 115.0, 224.0, 267.0, 398.0, 537.0, 734.0, 1119.0, 1625.0, 2442.0, 3727.0, 5634.0, 9760.0, 18580.0, 43492.0, 142817.0, 539219.0, 177534.0, 50384.0, 20742.0, 10448.0, 6347.0, 3901.0, 2545.0, 1694.0, 1196.0, 799.0, 568.0, 411.0, 272.0, 197.0, 141.0, 115.0, 67.0, 63.0, 32.0, 28.0, 17.0, 16.0, 14.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.0229644775390625, -0.02218794822692871, -0.021411418914794922, -0.020634889602661133, -0.019858360290527344, -0.019081830978393555, -0.018305301666259766, -0.017528772354125977, -0.016752243041992188, -0.0159757137298584, -0.01519918441772461, -0.01442265510559082, -0.013646125793457031, -0.012869596481323242, -0.012093067169189453, -0.011316537857055664, -0.010540008544921875, -0.009763479232788086, -0.008986949920654297, -0.008210420608520508, -0.007433891296386719, -0.00665736198425293, -0.005880832672119141, -0.0051043033599853516, -0.0043277740478515625, -0.0035512447357177734, -0.0027747154235839844, -0.0019981861114501953, -0.0012216567993164062, -0.0004451274871826172, 0.0003314018249511719, 0.001107931137084961, 0.00188446044921875, 0.002660989761352539, 0.003437519073486328, 0.004214048385620117, 0.004990577697753906, 0.005767107009887695, 0.006543636322021484, 0.0073201656341552734, 0.008096694946289062, 0.008873224258422852, 0.00964975357055664, 0.01042628288269043, 0.011202812194824219, 0.011979341506958008, 0.012755870819091797, 0.013532400131225586, 0.014308929443359375, 0.015085458755493164, 0.015861988067626953, 0.016638517379760742, 0.01741504669189453, 0.01819157600402832, 0.01896810531616211, 0.0197446346282959, 0.020521163940429688, 0.021297693252563477, 0.022074222564697266, 0.022850751876831055, 0.023627281188964844, 0.024403810501098633, 0.025180339813232422, 0.02595686912536621, 0.0267333984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 5.0, 9.0, 10.0, 15.0, 7.0, 10.0, 14.0, 14.0, 17.0, 18.0, 19.0, 30.0, 30.0, 26.0, 27.0, 38.0, 41.0, 34.0, 37.0, 38.0, 32.0, 50.0, 44.0, 34.0, 35.0, 38.0, 31.0, 35.0, 27.0, 38.0, 22.0, 23.0, 25.0, 18.0, 16.0, 19.0, 7.0, 13.0, 8.0, 4.0, 13.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0], "bins": [-0.0156402587890625, -0.015168905258178711, -0.014697551727294922, -0.014226198196411133, -0.013754844665527344, -0.013283491134643555, -0.012812137603759766, -0.012340784072875977, -0.011869430541992188, -0.011398077011108398, -0.01092672348022461, -0.01045536994934082, -0.009984016418457031, -0.009512662887573242, -0.009041309356689453, -0.008569955825805664, -0.008098602294921875, -0.007627248764038086, -0.007155895233154297, -0.006684541702270508, -0.006213188171386719, -0.00574183464050293, -0.005270481109619141, -0.0047991275787353516, -0.0043277740478515625, -0.0038564205169677734, -0.0033850669860839844, -0.0029137134552001953, -0.0024423599243164062, -0.001971006393432617, -0.0014996528625488281, -0.001028299331665039, -0.00055694580078125, -8.559226989746094e-05, 0.0003857612609863281, 0.0008571147918701172, 0.0013284683227539062, 0.0017998218536376953, 0.0022711753845214844, 0.0027425289154052734, 0.0032138824462890625, 0.0036852359771728516, 0.004156589508056641, 0.00462794303894043, 0.005099296569824219, 0.005570650100708008, 0.006042003631591797, 0.006513357162475586, 0.006984710693359375, 0.007456064224243164, 0.007927417755126953, 0.008398771286010742, 0.008870124816894531, 0.00934147834777832, 0.00981283187866211, 0.010284185409545898, 0.010755538940429688, 0.011226892471313477, 0.011698246002197266, 0.012169599533081055, 0.012640953063964844, 0.013112306594848633, 0.013583660125732422, 0.014055013656616211, 0.0145263671875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 12.0, 11.0, 10.0, 14.0, 26.0, 31.0, 33.0, 54.0, 70.0, 128.0, 173.0, 256.0, 330.0, 506.0, 793.0, 1278.0, 2194.0, 4100.0, 9369.0, 27622.0, 207717.0, 725557.0, 43687.0, 12490.0, 5234.0, 2562.0, 1552.0, 893.0, 561.0, 357.0, 270.0, 174.0, 129.0, 98.0, 76.0, 44.0, 34.0, 29.0, 24.0, 14.0, 18.0, 7.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00445556640625, -0.004325121641159058, -0.004194676876068115, -0.004064232110977173, -0.0039337873458862305, -0.003803342580795288, -0.0036728978157043457, -0.0035424530506134033, -0.003412008285522461, -0.0032815635204315186, -0.003151118755340576, -0.003020673990249634, -0.0028902292251586914, -0.002759784460067749, -0.0026293396949768066, -0.0024988949298858643, -0.002368450164794922, -0.0022380053997039795, -0.002107560634613037, -0.0019771158695220947, -0.0018466711044311523, -0.00171622633934021, -0.0015857815742492676, -0.0014553368091583252, -0.0013248920440673828, -0.0011944472789764404, -0.001064002513885498, -0.0009335577487945557, -0.0008031129837036133, -0.0006726682186126709, -0.0005422234535217285, -0.00041177868843078613, -0.00028133392333984375, -0.00015088915824890137, -2.0444393157958984e-05, 0.0001100003719329834, 0.00024044513702392578, 0.00037088990211486816, 0.0005013346672058105, 0.0006317794322967529, 0.0007622241973876953, 0.0008926689624786377, 0.00102311372756958, 0.0011535584926605225, 0.0012840032577514648, 0.0014144480228424072, 0.0015448927879333496, 0.001675337553024292, 0.0018057823181152344, 0.0019362270832061768, 0.002066671848297119, 0.0021971166133880615, 0.002327561378479004, 0.0024580061435699463, 0.0025884509086608887, 0.002718895673751831, 0.0028493404388427734, 0.002979785203933716, 0.003110229969024658, 0.0032406747341156006, 0.003371119499206543, 0.0035015642642974854, 0.0036320090293884277, 0.00376245379447937, 0.0038928985595703125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 9.0, 4.0, 0.0, 9.0, 11.0, 20.0, 27.0, 25.0, 41.0, 0.0, 56.0, 74.0, 81.0, 91.0, 106.0, 100.0, 0.0, 82.0, 71.0, 47.0, 37.0, 36.0, 18.0, 0.0, 16.0, 8.0, 6.0, 8.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6773119568824768e-06, -1.6260892152786255e-06, -1.5748664736747742e-06, -1.5236437320709229e-06, -1.4724209904670715e-06, -1.4211982488632202e-06, -1.369975507259369e-06, -1.3187527656555176e-06, -1.2675300240516663e-06, -1.216307282447815e-06, -1.1650845408439636e-06, -1.1138617992401123e-06, -1.062639057636261e-06, -1.0114163160324097e-06, -9.601935744285583e-07, -9.08970832824707e-07, -8.577480912208557e-07, -8.065253496170044e-07, -7.553026080131531e-07, -7.040798664093018e-07, -6.528571248054504e-07, -6.016343832015991e-07, -5.504116415977478e-07, -4.991888999938965e-07, -4.4796615839004517e-07, -3.9674341678619385e-07, -3.4552067518234253e-07, -2.942979335784912e-07, -2.430751919746399e-07, -1.9185245037078857e-07, -1.4062970876693726e-07, -8.940696716308594e-08, -3.818422555923462e-08, 1.30385160446167e-08, 6.426125764846802e-08, 1.1548399925231934e-07, 1.6670674085617065e-07, 2.1792948246002197e-07, 2.691522240638733e-07, 3.203749656677246e-07, 3.7159770727157593e-07, 4.2282044887542725e-07, 4.7404319047927856e-07, 5.252659320831299e-07, 5.764886736869812e-07, 6.277114152908325e-07, 6.789341568946838e-07, 7.301568984985352e-07, 7.813796401023865e-07, 8.326023817062378e-07, 8.838251233100891e-07, 9.350478649139404e-07, 9.862706065177917e-07, 1.037493348121643e-06, 1.0887160897254944e-06, 1.1399388313293457e-06, 1.191161572933197e-06, 1.2423843145370483e-06, 1.2936070561408997e-06, 1.344829797744751e-06, 1.3960525393486023e-06, 1.4472752809524536e-06, 1.498498022556305e-06, 1.5497207641601562e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 4.0, 13.0, 8.0, 18.0, 35.0, 34.0, 58.0, 81.0, 111.0, 154.0, 233.0, 320.0, 527.0, 688.0, 1040.0, 1745.0, 2867.0, 5040.0, 9674.0, 21549.0, 67676.0, 589260.0, 264132.0, 47060.0, 17000.0, 7945.0, 4222.0, 2538.0, 1514.0, 979.0, 624.0, 449.0, 264.0, 180.0, 143.0, 92.0, 77.0, 53.0, 34.0, 26.0, 28.0, 14.0, 10.0, 9.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0037136077880859375, -0.0036039352416992188, -0.0034942626953125, -0.0033845901489257812, -0.0032749176025390625, -0.0031652450561523438, -0.003055572509765625, -0.0029458999633789062, -0.0028362274169921875, -0.0027265548706054688, -0.00261688232421875, -0.0025072097778320312, -0.0023975372314453125, -0.0022878646850585938, -0.002178192138671875, -0.0020685195922851562, -0.0019588470458984375, -0.0018491744995117188, -0.001739501953125, -0.0016298294067382812, -0.0015201568603515625, -0.0014104843139648438, -0.001300811767578125, -0.0011911392211914062, -0.0010814666748046875, -0.0009717941284179688, -0.00086212158203125, -0.0007524490356445312, -0.0006427764892578125, -0.0005331039428710938, -0.000423431396484375, -0.00031375885009765625, -0.0002040863037109375, -9.441375732421875e-05, 1.52587890625e-05, 0.00012493133544921875, 0.0002346038818359375, 0.00034427642822265625, 0.000453948974609375, 0.0005636215209960938, 0.0006732940673828125, 0.0007829666137695312, 0.00089263916015625, 0.0010023117065429688, 0.0011119842529296875, 0.0012216567993164062, 0.001331329345703125, 0.0014410018920898438, 0.0015506744384765625, 0.0016603469848632812, 0.00177001953125, 0.0018796920776367188, 0.0019893646240234375, 0.0020990371704101562, 0.002208709716796875, 0.0023183822631835938, 0.0024280548095703125, 0.0025377273559570312, 0.00264739990234375, 0.0027570724487304688, 0.0028667449951171875, 0.0029764175415039062, 0.003086090087890625, 0.0031957626342773438, 0.0033054351806640625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 3.0, 5.0, 6.0, 10.0, 10.0, 18.0, 19.0, 17.0, 45.0, 53.0, 82.0, 235.0, 210.0, 80.0, 41.0, 50.0, 33.0, 31.0, 9.0, 7.0, 11.0, 8.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009355545043945312, -0.0009021013975143433, -0.0008686482906341553, -0.0008351951837539673, -0.0008017420768737793, -0.0007682889699935913, -0.0007348358631134033, -0.0007013827562332153, -0.0006679296493530273, -0.0006344765424728394, -0.0006010234355926514, -0.0005675703287124634, -0.0005341172218322754, -0.0005006641149520874, -0.0004672110080718994, -0.0004337579011917114, -0.00040030479431152344, -0.00036685168743133545, -0.00033339858055114746, -0.00029994547367095947, -0.0002664923667907715, -0.0002330392599105835, -0.0001995861530303955, -0.00016613304615020752, -0.00013267993927001953, -9.922683238983154e-05, -6.577372550964355e-05, -3.2320618629455566e-05, 1.1324882507324219e-06, 3.458559513092041e-05, 6.80387020111084e-05, 0.00010149180889129639, 0.00013494491577148438, 0.00016839802265167236, 0.00020185112953186035, 0.00023530423641204834, 0.00026875734329223633, 0.0003022104501724243, 0.0003356635570526123, 0.0003691166639328003, 0.0004025697708129883, 0.00043602287769317627, 0.00046947598457336426, 0.0005029290914535522, 0.0005363821983337402, 0.0005698353052139282, 0.0006032884120941162, 0.0006367415189743042, 0.0006701946258544922, 0.0007036477327346802, 0.0007371008396148682, 0.0007705539464950562, 0.0008040070533752441, 0.0008374601602554321, 0.0008709132671356201, 0.0009043663740158081, 0.0009378194808959961, 0.0009712725877761841, 0.001004725694656372, 0.00103817880153656, 0.001071631908416748, 0.001105085015296936, 0.001138538122177124, 0.001171991229057312, 0.0012054443359375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 5.0, 4.0, 8.0, 14.0, 16.0, 22.0, 30.0, 29.0, 31.0, 47.0, 48.0, 63.0, 74.0, 96.0, 83.0, 72.0, 63.0, 59.0, 42.0, 43.0, 18.0, 32.0, 18.0, 10.0, 14.0, 10.0, 11.0, 9.0, 5.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.03354687988758087, -0.03256634250283241, -0.031585805118083954, -0.030605269595980644, -0.029624734073877335, -0.028644196689128876, -0.027663659304380417, -0.026683121919631958, -0.02570258639752865, -0.02472204901278019, -0.02374151349067688, -0.02276097610592842, -0.021780438721179962, -0.020799903199076653, -0.019819365814328194, -0.018838830292224884, -0.017858292907476425, -0.016877755522727966, -0.015897220000624657, -0.014916682615876198, -0.013936146162450314, -0.01295560970902443, -0.01197507232427597, -0.010994535870850086, -0.010013999417424202, -0.009033462963998318, -0.008052926510572433, -0.007072389125823975, -0.00609185267239809, -0.005111316218972206, -0.0041307792998850346, -0.003150242380797863, -0.0021697040647268295, -0.0011891673784703016, -0.00020863069221377373, 0.0007719059940427542, 0.001752442680299282, 0.0027329791337251663, 0.003713516052812338, 0.004694052971899509, 0.005674589425325394, 0.006655125878751278, 0.0076356627978384495, 0.008616199716925621, 0.009596736170351505, 0.01057727262377739, 0.011557810008525848, 0.012538346461951733, 0.013518882915377617, 0.014499419368803501, 0.015479955822229385, 0.016460493206977844, 0.017441030591726303, 0.018421566113829613, 0.01940210349857807, 0.02038263902068138, 0.02136317640542984, 0.0223437137901783, 0.02332424931228161, 0.024304786697030067, 0.025285322219133377, 0.026265859603881836, 0.027246396988630295, 0.028226934373378754, 0.029207469895482063]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 5.0, 7.0, 10.0, 11.0, 7.0, 16.0, 19.0, 18.0, 24.0, 20.0, 25.0, 23.0, 36.0, 30.0, 40.0, 32.0, 46.0, 39.0, 44.0, 45.0, 37.0, 37.0, 31.0, 44.0, 24.0, 38.0, 37.0, 35.0, 35.0, 28.0, 19.0, 19.0, 20.0, 17.0, 8.0, 8.0, 13.0, 12.0, 3.0, 12.0, 8.0, 6.0, 5.0, 0.0, 0.0, 4.0, 2.0], "bins": [-0.027385452762246132, -0.02664494886994362, -0.025904444977641106, -0.025163941085338593, -0.02442343533039093, -0.023682931438088417, -0.022942427545785904, -0.02220192365348339, -0.021461419761180878, -0.020720915868878365, -0.01998041197657585, -0.01923990622162819, -0.018499402329325676, -0.017758898437023163, -0.01701839454472065, -0.016277890652418137, -0.015537384897470474, -0.014796881005167961, -0.014056376181542873, -0.01331587228924036, -0.012575367465615273, -0.01183486357331276, -0.011094359681010246, -0.010353855788707733, -0.009613350965082645, -0.008872847072780132, -0.008132342249155045, -0.007391838356852531, -0.006651333998888731, -0.005910829640924931, -0.0051703257486224174, -0.004429821390658617, -0.003689318895339966, -0.0029488145373761654, -0.0022083104122430086, -0.0014678062871098518, -0.0007273019291460514, 1.3202428817749023e-05, 0.0007537063211202621, 0.0014942106790840626, 0.002234715037047863, 0.0029752193950116634, 0.00371572352014482, 0.004456227645277977, 0.005196732003241777, 0.005937236361205578, 0.006677740253508091, 0.007418244611471891, 0.008158748969435692, 0.008899252861738205, 0.009639757685363293, 0.010380261577665806, 0.011120766401290894, 0.011861270293593407, 0.01260177418589592, 0.013342278078198433, 0.01408278290182352, 0.014823286794126034, 0.015563791617751122, 0.016304295510053635, 0.017044799402356148, 0.01778530329465866, 0.018525809049606323, 0.019266312941908836, 0.02000681683421135]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 10.0, 12.0, 20.0, 31.0, 46.0, 61.0, 87.0, 119.0, 203.0, 275.0, 390.0, 572.0, 855.0, 1315.0, 1933.0, 2819.0, 4442.0, 6546.0, 10082.0, 15232.0, 24345.0, 38316.0, 63650.0, 109944.0, 212034.0, 240187.0, 125592.0, 70736.0, 42511.0, 26640.0, 16983.0, 10984.0, 7110.0, 4726.0, 3166.0, 2117.0, 1433.0, 921.0, 654.0, 430.0, 302.0, 227.0, 158.0, 99.0, 85.0, 44.0, 40.0, 20.0, 14.0, 16.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.045257568359375, -0.04389047622680664, -0.04252338409423828, -0.04115629196166992, -0.03978919982910156, -0.0384221076965332, -0.037055015563964844, -0.035687923431396484, -0.034320831298828125, -0.032953739166259766, -0.031586647033691406, -0.030219554901123047, -0.028852462768554688, -0.027485370635986328, -0.02611827850341797, -0.02475118637084961, -0.02338409423828125, -0.02201700210571289, -0.02064990997314453, -0.019282817840576172, -0.017915725708007812, -0.016548633575439453, -0.015181541442871094, -0.013814449310302734, -0.012447357177734375, -0.011080265045166016, -0.009713172912597656, -0.008346080780029297, -0.0069789886474609375, -0.005611896514892578, -0.004244804382324219, -0.0028777122497558594, -0.0015106201171875, -0.00014352798461914062, 0.0012235641479492188, 0.002590656280517578, 0.0039577484130859375, 0.005324840545654297, 0.006691932678222656, 0.008059024810791016, 0.009426116943359375, 0.010793209075927734, 0.012160301208496094, 0.013527393341064453, 0.014894485473632812, 0.016261577606201172, 0.01762866973876953, 0.01899576187133789, 0.02036285400390625, 0.02172994613647461, 0.02309703826904297, 0.024464130401611328, 0.025831222534179688, 0.027198314666748047, 0.028565406799316406, 0.029932498931884766, 0.031299591064453125, 0.032666683197021484, 0.034033775329589844, 0.0354008674621582, 0.03676795959472656, 0.03813505172729492, 0.03950214385986328, 0.04086923599243164, 0.042236328125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 12.0, 9.0, 9.0, 8.0, 16.0, 14.0, 21.0, 22.0, 21.0, 26.0, 35.0, 30.0, 30.0, 30.0, 38.0, 36.0, 46.0, 40.0, 42.0, 46.0, 35.0, 34.0, 31.0, 39.0, 34.0, 32.0, 32.0, 41.0, 23.0, 22.0, 22.0, 15.0, 19.0, 13.0, 7.0, 14.0, 8.0, 10.0, 6.0, 6.0, 9.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0231781005859375, -0.022519826889038086, -0.021861553192138672, -0.021203279495239258, -0.020545005798339844, -0.01988673210144043, -0.019228458404541016, -0.0185701847076416, -0.017911911010742188, -0.017253637313842773, -0.01659536361694336, -0.015937089920043945, -0.015278816223144531, -0.014620542526245117, -0.013962268829345703, -0.013303995132446289, -0.012645721435546875, -0.011987447738647461, -0.011329174041748047, -0.010670900344848633, -0.010012626647949219, -0.009354352951049805, -0.00869607925415039, -0.008037805557250977, -0.0073795318603515625, -0.0067212581634521484, -0.006062984466552734, -0.00540471076965332, -0.004746437072753906, -0.004088163375854492, -0.003429889678955078, -0.002771615982055664, -0.00211334228515625, -0.001455068588256836, -0.0007967948913574219, -0.0001385211944580078, 0.0005197525024414062, 0.0011780261993408203, 0.0018362998962402344, 0.0024945735931396484, 0.0031528472900390625, 0.0038111209869384766, 0.004469394683837891, 0.005127668380737305, 0.005785942077636719, 0.006444215774536133, 0.007102489471435547, 0.007760763168334961, 0.008419036865234375, 0.009077310562133789, 0.009735584259033203, 0.010393857955932617, 0.011052131652832031, 0.011710405349731445, 0.01236867904663086, 0.013026952743530273, 0.013685226440429688, 0.014343500137329102, 0.015001773834228516, 0.01566004753112793, 0.016318321228027344, 0.016976594924926758, 0.017634868621826172, 0.018293142318725586, 0.018951416015625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 9.0, 15.0, 11.0, 17.0, 16.0, 39.0, 60.0, 104.0, 114.0, 163.0, 277.0, 462.0, 700.0, 1096.0, 1682.0, 2602.0, 4453.0, 6919.0, 11916.0, 19633.0, 33485.0, 58089.0, 107903.0, 228982.0, 275814.0, 129625.0, 68311.0, 38567.0, 22609.0, 13484.0, 8157.0, 4870.0, 3116.0, 1904.0, 1170.0, 787.0, 459.0, 331.0, 204.0, 137.0, 95.0, 50.0, 46.0, 24.0, 23.0, 14.0, 4.0, 6.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.047271728515625, -0.04570293426513672, -0.04413414001464844, -0.042565345764160156, -0.040996551513671875, -0.039427757263183594, -0.03785896301269531, -0.03629016876220703, -0.03472137451171875, -0.03315258026123047, -0.03158378601074219, -0.030014991760253906, -0.028446197509765625, -0.026877403259277344, -0.025308609008789062, -0.02373981475830078, -0.0221710205078125, -0.02060222625732422, -0.019033432006835938, -0.017464637756347656, -0.015895843505859375, -0.014327049255371094, -0.012758255004882812, -0.011189460754394531, -0.00962066650390625, -0.008051872253417969, -0.0064830780029296875, -0.004914283752441406, -0.003345489501953125, -0.0017766952514648438, -0.0002079010009765625, 0.0013608932495117188, 0.0029296875, 0.004498481750488281, 0.0060672760009765625, 0.007636070251464844, 0.009204864501953125, 0.010773658752441406, 0.012342453002929688, 0.013911247253417969, 0.01548004150390625, 0.01704883575439453, 0.018617630004882812, 0.020186424255371094, 0.021755218505859375, 0.023324012756347656, 0.024892807006835938, 0.02646160125732422, 0.0280303955078125, 0.02959918975830078, 0.031167984008789062, 0.032736778259277344, 0.034305572509765625, 0.035874366760253906, 0.03744316101074219, 0.03901195526123047, 0.04058074951171875, 0.04214954376220703, 0.04371833801269531, 0.045287132263183594, 0.046855926513671875, 0.048424720764160156, 0.04999351501464844, 0.05156230926513672, 0.053131103515625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 10.0, 5.0, 8.0, 14.0, 14.0, 9.0, 23.0, 24.0, 22.0, 19.0, 31.0, 35.0, 35.0, 36.0, 39.0, 50.0, 51.0, 38.0, 52.0, 48.0, 37.0, 38.0, 40.0, 38.0, 40.0, 32.0, 27.0, 16.0, 28.0, 24.0, 20.0, 22.0, 15.0, 9.0, 17.0, 8.0, 8.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01519775390625, -0.014746904373168945, -0.01429605484008789, -0.013845205307006836, -0.013394355773925781, -0.012943506240844727, -0.012492656707763672, -0.012041807174682617, -0.011590957641601562, -0.011140108108520508, -0.010689258575439453, -0.010238409042358398, -0.009787559509277344, -0.009336709976196289, -0.008885860443115234, -0.00843501091003418, -0.007984161376953125, -0.00753331184387207, -0.007082462310791016, -0.006631612777709961, -0.006180763244628906, -0.0057299137115478516, -0.005279064178466797, -0.004828214645385742, -0.0043773651123046875, -0.003926515579223633, -0.003475666046142578, -0.0030248165130615234, -0.0025739669799804688, -0.002123117446899414, -0.0016722679138183594, -0.0012214183807373047, -0.00077056884765625, -0.0003197193145751953, 0.00013113021850585938, 0.0005819797515869141, 0.0010328292846679688, 0.0014836788177490234, 0.0019345283508300781, 0.002385377883911133, 0.0028362274169921875, 0.003287076950073242, 0.003737926483154297, 0.0041887760162353516, 0.004639625549316406, 0.005090475082397461, 0.005541324615478516, 0.00599217414855957, 0.006443023681640625, 0.00689387321472168, 0.007344722747802734, 0.007795572280883789, 0.008246421813964844, 0.008697271347045898, 0.009148120880126953, 0.009598970413208008, 0.010049819946289062, 0.010500669479370117, 0.010951519012451172, 0.011402368545532227, 0.011853218078613281, 0.012304067611694336, 0.01275491714477539, 0.013205766677856445, 0.0136566162109375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 15.0, 9.0, 28.0, 23.0, 52.0, 57.0, 75.0, 144.0, 222.0, 301.0, 454.0, 778.0, 1184.0, 1779.0, 2990.0, 4825.0, 8412.0, 15361.0, 34632.0, 170045.0, 705094.0, 54906.0, 20580.0, 10663.0, 6141.0, 3617.0, 2174.0, 1431.0, 870.0, 573.0, 342.0, 260.0, 161.0, 100.0, 71.0, 59.0, 33.0, 29.0, 22.0, 4.0, 2.0, 9.0, 10.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003292083740234375, -0.0031865835189819336, -0.003081083297729492, -0.0029755830764770508, -0.0028700828552246094, -0.002764582633972168, -0.0026590824127197266, -0.002553582191467285, -0.0024480819702148438, -0.0023425817489624023, -0.002237081527709961, -0.0021315813064575195, -0.002026081085205078, -0.0019205808639526367, -0.0018150806427001953, -0.001709580421447754, -0.0016040802001953125, -0.001498579978942871, -0.0013930797576904297, -0.0012875795364379883, -0.0011820793151855469, -0.0010765790939331055, -0.0009710788726806641, -0.0008655786514282227, -0.0007600784301757812, -0.0006545782089233398, -0.0005490779876708984, -0.00044357776641845703, -0.0003380775451660156, -0.00023257732391357422, -0.0001270771026611328, -2.1576881408691406e-05, 8.392333984375e-05, 0.0001894235610961914, 0.0002949237823486328, 0.0004004240036010742, 0.0005059242248535156, 0.000611424446105957, 0.0007169246673583984, 0.0008224248886108398, 0.0009279251098632812, 0.0010334253311157227, 0.001138925552368164, 0.0012444257736206055, 0.0013499259948730469, 0.0014554262161254883, 0.0015609264373779297, 0.001666426658630371, 0.0017719268798828125, 0.001877427101135254, 0.0019829273223876953, 0.0020884275436401367, 0.002193927764892578, 0.0022994279861450195, 0.002404928207397461, 0.0025104284286499023, 0.0026159286499023438, 0.002721428871154785, 0.0028269290924072266, 0.002932429313659668, 0.0030379295349121094, 0.0031434297561645508, 0.003248929977416992, 0.0033544301986694336, 0.003459930419921875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 8.0, 0.0, 5.0, 0.0, 27.0, 0.0, 40.0, 0.0, 64.0, 91.0, 0.0, 161.0, 0.0, 189.0, 0.0, 150.0, 0.0, 114.0, 0.0, 66.0, 44.0, 0.0, 20.0, 0.0, 11.0, 0.0, 2.0, 0.0, 7.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1594966053962708e-06, -1.126900315284729e-06, -1.0943040251731873e-06, -1.0617077350616455e-06, -1.0291114449501038e-06, -9.96515154838562e-07, -9.639188647270203e-07, -9.313225746154785e-07, -8.987262845039368e-07, -8.66129994392395e-07, -8.335337042808533e-07, -8.009374141693115e-07, -7.683411240577698e-07, -7.35744833946228e-07, -7.031485438346863e-07, -6.705522537231445e-07, -6.379559636116028e-07, -6.05359673500061e-07, -5.727633833885193e-07, -5.401670932769775e-07, -5.075708031654358e-07, -4.7497451305389404e-07, -4.423782229423523e-07, -4.0978193283081055e-07, -3.771856427192688e-07, -3.4458935260772705e-07, -3.119930624961853e-07, -2.7939677238464355e-07, -2.468004822731018e-07, -2.1420419216156006e-07, -1.816079020500183e-07, -1.4901161193847656e-07, -1.1641532182693481e-07, -8.381903171539307e-08, -5.122274160385132e-08, -1.862645149230957e-08, 1.3969838619232178e-08, 4.6566128730773926e-08, 7.916241884231567e-08, 1.1175870895385742e-07, 1.4435499906539917e-07, 1.7695128917694092e-07, 2.0954757928848267e-07, 2.421438694000244e-07, 2.7474015951156616e-07, 3.073364496231079e-07, 3.3993273973464966e-07, 3.725290298461914e-07, 4.0512531995773315e-07, 4.377216100692749e-07, 4.7031790018081665e-07, 5.029141902923584e-07, 5.355104804039001e-07, 5.681067705154419e-07, 6.007030606269836e-07, 6.332993507385254e-07, 6.658956408500671e-07, 6.984919309616089e-07, 7.310882210731506e-07, 7.636845111846924e-07, 7.962808012962341e-07, 8.288770914077759e-07, 8.614733815193176e-07, 8.940696716308594e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 12.0, 10.0, 21.0, 20.0, 35.0, 43.0, 47.0, 75.0, 88.0, 131.0, 196.0, 268.0, 373.0, 492.0, 728.0, 995.0, 1343.0, 1952.0, 2759.0, 4039.0, 5925.0, 8734.0, 14697.0, 29262.0, 111843.0, 729044.0, 72440.0, 24188.0, 13000.0, 7977.0, 5223.0, 3709.0, 2511.0, 1802.0, 1318.0, 885.0, 641.0, 466.0, 349.0, 247.0, 192.0, 131.0, 88.0, 63.0, 55.0, 41.0, 30.0, 17.0, 12.0, 14.0, 4.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0028057098388671875, -0.0027163028717041016, -0.0026268959045410156, -0.0025374889373779297, -0.0024480819702148438, -0.002358675003051758, -0.002269268035888672, -0.002179861068725586, -0.0020904541015625, -0.002001047134399414, -0.0019116401672363281, -0.0018222332000732422, -0.0017328262329101562, -0.0016434192657470703, -0.0015540122985839844, -0.0014646053314208984, -0.0013751983642578125, -0.0012857913970947266, -0.0011963844299316406, -0.0011069774627685547, -0.0010175704956054688, -0.0009281635284423828, -0.0008387565612792969, -0.0007493495941162109, -0.000659942626953125, -0.0005705356597900391, -0.0004811286926269531, -0.0003917217254638672, -0.00030231475830078125, -0.0002129077911376953, -0.00012350082397460938, -3.409385681152344e-05, 5.53131103515625e-05, 0.00014472007751464844, 0.00023412704467773438, 0.0003235340118408203, 0.00041294097900390625, 0.0005023479461669922, 0.0005917549133300781, 0.0006811618804931641, 0.00077056884765625, 0.0008599758148193359, 0.0009493827819824219, 0.0010387897491455078, 0.0011281967163085938, 0.0012176036834716797, 0.0013070106506347656, 0.0013964176177978516, 0.0014858245849609375, 0.0015752315521240234, 0.0016646385192871094, 0.0017540454864501953, 0.0018434524536132812, 0.0019328594207763672, 0.002022266387939453, 0.002111673355102539, 0.002201080322265625, 0.002290487289428711, 0.002379894256591797, 0.002469301223754883, 0.0025587081909179688, 0.0026481151580810547, 0.0027375221252441406, 0.0028269290924072266, 0.0029163360595703125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 4.0, 9.0, 3.0, 4.0, 11.0, 7.0, 10.0, 7.0, 13.0, 17.0, 31.0, 79.0, 174.0, 324.0, 101.0, 60.0, 30.0, 19.0, 10.0, 13.0, 7.0, 7.0, 9.0, 2.0, 8.0, 3.0, 1.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00080108642578125, -0.0007736161351203918, -0.0007461458444595337, -0.0007186755537986755, -0.0006912052631378174, -0.0006637349724769592, -0.0006362646818161011, -0.0006087943911552429, -0.0005813241004943848, -0.0005538538098335266, -0.0005263835191726685, -0.0004989132285118103, -0.00047144293785095215, -0.000443972647190094, -0.00041650235652923584, -0.0003890320658683777, -0.00036156177520751953, -0.0003340914845466614, -0.0003066211938858032, -0.00027915090322494507, -0.0002516806125640869, -0.00022421032190322876, -0.0001967400312423706, -0.00016926974058151245, -0.0001417994499206543, -0.00011432915925979614, -8.685886859893799e-05, -5.9388577938079834e-05, -3.191828727722168e-05, -4.447996616363525e-06, 2.302229404449463e-05, 5.049258470535278e-05, 7.796287536621094e-05, 0.00010543316602706909, 0.00013290345668792725, 0.0001603737473487854, 0.00018784403800964355, 0.0002153143286705017, 0.00024278461933135986, 0.000270254909992218, 0.00029772520065307617, 0.0003251954913139343, 0.0003526657819747925, 0.00038013607263565063, 0.0004076063632965088, 0.00043507665395736694, 0.0004625469446182251, 0.0004900172352790833, 0.0005174875259399414, 0.0005449578166007996, 0.0005724281072616577, 0.0005998983979225159, 0.000627368688583374, 0.0006548389792442322, 0.0006823092699050903, 0.0007097795605659485, 0.0007372498512268066, 0.0007647201418876648, 0.000792190432548523, 0.0008196607232093811, 0.0008471310138702393, 0.0008746013045310974, 0.0009020715951919556, 0.0009295418858528137, 0.0009570121765136719]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 5.0, 8.0, 8.0, 11.0, 13.0, 21.0, 32.0, 32.0, 48.0, 66.0, 60.0, 91.0, 98.0, 113.0, 99.0, 55.0, 53.0, 50.0, 32.0, 18.0, 16.0, 18.0, 9.0, 12.0, 7.0, 2.0, 8.0, 2.0, 1.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.034813739359378815, -0.03375864773988724, -0.03270355612039566, -0.03164846822619438, -0.030593376606702805, -0.029538284987211227, -0.02848319336771965, -0.027428103610873222, -0.026373013854026794, -0.025317922234535217, -0.02426283247768879, -0.023207740858197212, -0.022152651101350784, -0.021097559481859207, -0.02004246786236763, -0.018987378105521202, -0.017932286486029625, -0.016877194866538048, -0.01582210510969162, -0.014767013490200043, -0.013711923733353615, -0.012656832113862038, -0.011601741425693035, -0.010546650737524033, -0.00949156004935503, -0.008436469361186028, -0.007381378673017025, -0.006326287519186735, -0.005271196831017733, -0.00421610614284873, -0.0031610149890184402, -0.0021059243008494377, -0.0010508336126804352, 4.257191903889179e-06, 0.0010593479964882135, 0.0021144389174878597, 0.0031695296056568623, 0.004224620293825865, 0.005279711447656155, 0.006334802135825157, 0.00738989282399416, 0.008444983512163162, 0.009500074200332165, 0.010555164888501167, 0.011610256507992744, 0.012665346264839172, 0.01372043788433075, 0.014775528572499752, 0.015830619260668755, 0.01688571088016033, 0.01794080063700676, 0.018995892256498337, 0.020050982013344765, 0.021106073632836342, 0.02216116338968277, 0.023216255009174347, 0.024271346628665924, 0.0253264382481575, 0.02638152800500393, 0.027436619624495506, 0.028491709381341934, 0.02954680100083351, 0.03060189262032509, 0.03165698051452637, 0.032712072134017944]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 8.0, 7.0, 17.0, 4.0, 7.0, 14.0, 12.0, 19.0, 23.0, 30.0, 27.0, 26.0, 40.0, 35.0, 32.0, 33.0, 35.0, 32.0, 39.0, 33.0, 41.0, 41.0, 41.0, 43.0, 42.0, 22.0, 40.0, 29.0, 34.0, 20.0, 21.0, 23.0, 18.0, 16.0, 19.0, 11.0, 11.0, 15.0, 12.0, 2.0, 6.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.02212877757847309, -0.02144228108227253, -0.02075578272342682, -0.020069286227226257, -0.019382789731025696, -0.018696293234825134, -0.018009794875979424, -0.017323298379778862, -0.01663680002093315, -0.01595030352473259, -0.015263806097209454, -0.014577308669686317, -0.013890812173485756, -0.01320431474596262, -0.012517817318439484, -0.011831320822238922, -0.01114482432603836, -0.010458326898515224, -0.009771830402314663, -0.009085332974791527, -0.008398836478590965, -0.007712339051067829, -0.007025841623544693, -0.006339344661682844, -0.005652847699820995, -0.0049663507379591465, -0.004279853776097298, -0.0035933563485741615, -0.0029068593867123127, -0.002220362424850464, -0.0015338649973273277, -0.0008473680354654789, -0.0001608729362487793, 0.0005256241420283914, 0.001212121220305562, 0.0018986184149980545, 0.0025851153768599033, 0.003271612338721752, 0.003958109766244888, 0.004644606728106737, 0.005331103689968586, 0.006017600651830435, 0.006704097613692284, 0.00739059504121542, 0.008077092468738556, 0.008763588964939117, 0.009450086392462254, 0.01013658381998539, 0.010823080316185951, 0.011509577743709087, 0.012196074239909649, 0.012882571667432785, 0.013569068163633347, 0.014255565591156483, 0.014942063018679619, 0.01562855951488018, 0.01631505787372589, 0.017001554369926453, 0.017688052728772163, 0.018374549224972725, 0.019061045721173286, 0.019747544080018997, 0.02043404057621956, 0.02112053707242012, 0.021807033568620682]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 9.0, 13.0, 16.0, 21.0, 32.0, 46.0, 57.0, 91.0, 95.0, 152.0, 205.0, 318.0, 487.0, 603.0, 901.0, 1444.0, 2055.0, 3115.0, 4678.0, 7269.0, 11357.0, 18282.0, 29687.0, 50467.0, 91160.0, 177593.0, 470330.0, 1671708.0, 1038049.0, 292092.0, 134955.0, 73020.0, 42564.0, 25486.0, 15880.0, 10152.0, 6663.0, 4396.0, 2814.0, 1869.0, 1334.0, 904.0, 644.0, 388.0, 275.0, 188.0, 147.0, 89.0, 61.0, 46.0, 23.0, 25.0, 14.0, 11.0, 2.0, 4.0, 4.0, 3.0], "bins": [-0.0311279296875, -0.030206918716430664, -0.029285907745361328, -0.028364896774291992, -0.027443885803222656, -0.02652287483215332, -0.025601863861083984, -0.02468085289001465, -0.023759841918945312, -0.022838830947875977, -0.02191781997680664, -0.020996809005737305, -0.02007579803466797, -0.019154787063598633, -0.018233776092529297, -0.01731276512145996, -0.016391754150390625, -0.015470743179321289, -0.014549732208251953, -0.013628721237182617, -0.012707710266113281, -0.011786699295043945, -0.01086568832397461, -0.009944677352905273, -0.009023666381835938, -0.008102655410766602, -0.007181644439697266, -0.00626063346862793, -0.005339622497558594, -0.004418611526489258, -0.003497600555419922, -0.002576589584350586, -0.00165557861328125, -0.0007345676422119141, 0.00018644332885742188, 0.0011074542999267578, 0.0020284652709960938, 0.0029494762420654297, 0.0038704872131347656, 0.0047914981842041016, 0.0057125091552734375, 0.0066335201263427734, 0.007554531097412109, 0.008475542068481445, 0.009396553039550781, 0.010317564010620117, 0.011238574981689453, 0.012159585952758789, 0.013080596923828125, 0.014001607894897461, 0.014922618865966797, 0.015843629837036133, 0.01676464080810547, 0.017685651779174805, 0.01860666275024414, 0.019527673721313477, 0.020448684692382812, 0.02136969566345215, 0.022290706634521484, 0.02321171760559082, 0.024132728576660156, 0.025053739547729492, 0.025974750518798828, 0.026895761489868164, 0.0278167724609375]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 10.0, 11.0, 6.0, 8.0, 4.0, 18.0, 10.0, 21.0, 24.0, 16.0, 29.0, 22.0, 34.0, 43.0, 39.0, 42.0, 34.0, 35.0, 37.0, 46.0, 35.0, 37.0, 47.0, 42.0, 40.0, 38.0, 26.0, 38.0, 32.0, 22.0, 22.0, 26.0, 19.0, 12.0, 13.0, 11.0, 12.0, 12.0, 5.0, 7.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0132293701171875, -0.012815237045288086, -0.012401103973388672, -0.011986970901489258, -0.011572837829589844, -0.01115870475769043, -0.010744571685791016, -0.010330438613891602, -0.009916305541992188, -0.009502172470092773, -0.00908803939819336, -0.008673906326293945, -0.008259773254394531, -0.007845640182495117, -0.007431507110595703, -0.007017374038696289, -0.006603240966796875, -0.006189107894897461, -0.005774974822998047, -0.005360841751098633, -0.004946708679199219, -0.004532575607299805, -0.004118442535400391, -0.0037043094635009766, -0.0032901763916015625, -0.0028760433197021484, -0.0024619102478027344, -0.0020477771759033203, -0.0016336441040039062, -0.0012195110321044922, -0.0008053779602050781, -0.00039124488830566406, 2.288818359375e-05, 0.00043702125549316406, 0.0008511543273925781, 0.0012652873992919922, 0.0016794204711914062, 0.0020935535430908203, 0.0025076866149902344, 0.0029218196868896484, 0.0033359527587890625, 0.0037500858306884766, 0.004164218902587891, 0.004578351974487305, 0.004992485046386719, 0.005406618118286133, 0.005820751190185547, 0.006234884262084961, 0.006649017333984375, 0.007063150405883789, 0.007477283477783203, 0.007891416549682617, 0.008305549621582031, 0.008719682693481445, 0.00913381576538086, 0.009547948837280273, 0.009962081909179688, 0.010376214981079102, 0.010790348052978516, 0.01120448112487793, 0.011618614196777344, 0.012032747268676758, 0.012446880340576172, 0.012861013412475586, 0.013275146484375]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 15.0, 18.0, 32.0, 45.0, 88.0, 143.0, 183.0, 300.0, 522.0, 777.0, 1240.0, 1837.0, 2884.0, 4450.0, 6995.0, 10898.0, 17484.0, 28079.0, 47393.0, 81114.0, 147295.0, 289790.0, 649829.0, 1449724.0, 747819.0, 322530.0, 161778.0, 88380.0, 51181.0, 30108.0, 18967.0, 11713.0, 7391.0, 4795.0, 3041.0, 1893.0, 1254.0, 812.0, 527.0, 344.0, 215.0, 145.0, 88.0, 58.0, 36.0, 30.0, 14.0, 12.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0214385986328125, -0.02075958251953125, -0.02008056640625, -0.01940155029296875, -0.0187225341796875, -0.01804351806640625, -0.017364501953125, -0.01668548583984375, -0.0160064697265625, -0.01532745361328125, -0.0146484375, -0.01396942138671875, -0.0132904052734375, -0.01261138916015625, -0.011932373046875, -0.01125335693359375, -0.0105743408203125, -0.00989532470703125, -0.00921630859375, -0.00853729248046875, -0.0078582763671875, -0.00717926025390625, -0.006500244140625, -0.00582122802734375, -0.0051422119140625, -0.00446319580078125, -0.0037841796875, -0.00310516357421875, -0.0024261474609375, -0.00174713134765625, -0.001068115234375, -0.00038909912109375, 0.0002899169921875, 0.00096893310546875, 0.00164794921875, 0.00232696533203125, 0.0030059814453125, 0.00368499755859375, 0.004364013671875, 0.00504302978515625, 0.0057220458984375, 0.00640106201171875, 0.007080078125, 0.00775909423828125, 0.0084381103515625, 0.00911712646484375, 0.009796142578125, 0.01047515869140625, 0.0111541748046875, 0.01183319091796875, 0.01251220703125, 0.01319122314453125, 0.0138702392578125, 0.01454925537109375, 0.015228271484375, 0.01590728759765625, 0.0165863037109375, 0.01726531982421875, 0.0179443359375, 0.01862335205078125, 0.0193023681640625, 0.01998138427734375, 0.020660400390625, 0.02133941650390625, 0.0220184326171875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 8.0, 21.0, 10.0, 15.0, 24.0, 29.0, 44.0, 49.0, 52.0, 54.0, 80.0, 107.0, 105.0, 144.0, 162.0, 218.0, 223.0, 253.0, 255.0, 300.0, 271.0, 248.0, 225.0, 174.0, 167.0, 155.0, 122.0, 102.0, 93.0, 62.0, 42.0, 54.0, 44.0, 33.0, 27.0, 20.0, 18.0, 13.0, 9.0, 5.0, 5.0, 6.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.007808685302734375, -0.007589280605316162, -0.007369875907897949, -0.007150471210479736, -0.0069310665130615234, -0.0067116618156433105, -0.006492257118225098, -0.006272852420806885, -0.006053447723388672, -0.005834043025970459, -0.005614638328552246, -0.005395233631134033, -0.00517582893371582, -0.004956424236297607, -0.0047370195388793945, -0.004517614841461182, -0.004298210144042969, -0.004078805446624756, -0.003859400749206543, -0.00363999605178833, -0.003420591354370117, -0.0032011866569519043, -0.0029817819595336914, -0.0027623772621154785, -0.0025429725646972656, -0.0023235678672790527, -0.00210416316986084, -0.001884758472442627, -0.001665353775024414, -0.0014459490776062012, -0.0012265443801879883, -0.0010071396827697754, -0.0007877349853515625, -0.0005683302879333496, -0.0003489255905151367, -0.00012952089309692383, 8.988380432128906e-05, 0.00030928850173950195, 0.0005286931991577148, 0.0007480978965759277, 0.0009675025939941406, 0.0011869072914123535, 0.0014063119888305664, 0.0016257166862487793, 0.0018451213836669922, 0.002064526081085205, 0.002283930778503418, 0.002503335475921631, 0.0027227401733398438, 0.0029421448707580566, 0.0031615495681762695, 0.0033809542655944824, 0.0036003589630126953, 0.003819763660430908, 0.004039168357849121, 0.004258573055267334, 0.004477977752685547, 0.00469738245010376, 0.004916787147521973, 0.0051361918449401855, 0.0053555965423583984, 0.005575001239776611, 0.005794405937194824, 0.006013810634613037, 0.00623321533203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 9.0, 13.0, 17.0, 30.0, 27.0, 47.0, 47.0, 63.0, 76.0, 95.0, 113.0, 93.0, 80.0, 58.0, 40.0, 35.0, 32.0, 29.0, 22.0, 17.0, 9.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017520811408758163, -0.016834380105137825, -0.016147948801517487, -0.015461518429219723, -0.014775088056921959, -0.01408865675330162, -0.013402225449681282, -0.012715794146060944, -0.01202936377376318, -0.011342932470142841, -0.010656502097845078, -0.009970070794224739, -0.0092836394906044, -0.008597209118306637, -0.007910777814686298, -0.007224346976727247, -0.006537916138768196, -0.005851485300809145, -0.005165054462850094, -0.004478623159229755, -0.0037921923212707043, -0.003105761483311653, -0.0024193301796913147, -0.0017328993417322636, -0.0010464685037732124, -0.0003600375493988395, 0.0003263934049755335, 0.0010128244757652283, 0.0016992553137242794, 0.0023856861516833305, 0.003072117455303669, 0.00375854829326272, 0.0044449809938669205, 0.005131411831825972, 0.005817842669785023, 0.006504273973405361, 0.007190704811364412, 0.007877135649323463, 0.008563566952943802, 0.00924999825656414, 0.009936428628861904, 0.010622859932482243, 0.011309290304780006, 0.011995721608400345, 0.012682152912020683, 0.013368583284318447, 0.014055014587938786, 0.01474144496023655, 0.015427876263856888, 0.016114307567477226, 0.016800738871097565, 0.017487168312072754, 0.018173599615693092, 0.01886003091931343, 0.01954646222293377, 0.020232893526554108, 0.020919322967529297, 0.021605754271149635, 0.022292185574769974, 0.022978615015745163, 0.0236650463193655, 0.02435147762298584, 0.02503790892660618, 0.025724340230226517, 0.026410771533846855]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 9.0, 5.0, 16.0, 8.0, 13.0, 12.0, 23.0, 20.0, 29.0, 30.0, 31.0, 28.0, 38.0, 45.0, 35.0, 55.0, 46.0, 36.0, 39.0, 37.0, 35.0, 25.0, 44.0, 31.0, 39.0, 46.0, 32.0, 24.0, 30.0, 20.0, 19.0, 15.0, 18.0, 16.0, 13.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01580195687711239, -0.01533374935388565, -0.014865540899336338, -0.0143973333761096, -0.013929124921560287, -0.01346091739833355, -0.012992709875106812, -0.012524501420557499, -0.012056292966008186, -0.011588085442781448, -0.011119876988232136, -0.010651669465005398, -0.010183461010456085, -0.009715253487229347, -0.00924704596400261, -0.008778837509453297, -0.008310629986226559, -0.00784242246299982, -0.007374214008450508, -0.00690600648522377, -0.0064377980306744576, -0.00596959050744772, -0.005501382518559694, -0.005033174529671669, -0.004564966540783644, -0.0040967585518956184, -0.003628550563007593, -0.0031603428069502115, -0.0026921348180621862, -0.002223926829174161, -0.0017557190731167793, -0.001287511084228754, -0.0008193040266633034, -0.000351096095982939, 0.00011711183469742537, 0.0005853197071701288, 0.001053527696058154, 0.0015217356849461794, 0.001989943441003561, 0.0024581514298915863, 0.0029263594187796116, 0.003394567407667637, 0.003862775396555662, 0.0043309833854436874, 0.004799190908670425, 0.005267399363219738, 0.005735606886446476, 0.006203814875334501, 0.0066720228642225266, 0.007140230853110552, 0.007608438841998577, 0.008076646365225315, 0.008544854819774628, 0.009013062343001366, 0.009481269866228104, 0.009949478320777416, 0.010417686775326729, 0.010885894298553467, 0.01135410275310278, 0.011822310276329517, 0.01229051873087883, 0.012758726254105568, 0.013226933777332306, 0.013695142231881618, 0.014163349755108356]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 12.0, 21.0, 25.0, 42.0, 53.0, 81.0, 113.0, 167.0, 236.0, 333.0, 482.0, 645.0, 1027.0, 1526.0, 2251.0, 3269.0, 5124.0, 8084.0, 13555.0, 23725.0, 45282.0, 95014.0, 223205.0, 322400.0, 151965.0, 67417.0, 33758.0, 18320.0, 10859.0, 6585.0, 4276.0, 2860.0, 1827.0, 1255.0, 855.0, 589.0, 422.0, 269.0, 202.0, 117.0, 79.0, 70.0, 52.0, 30.0, 20.0, 21.0, 9.0, 3.0, 9.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.00812530517578125, -0.007847785949707031, -0.0075702667236328125, -0.007292747497558594, -0.007015228271484375, -0.006737709045410156, -0.0064601898193359375, -0.006182670593261719, -0.0059051513671875, -0.005627632141113281, -0.0053501129150390625, -0.005072593688964844, -0.004795074462890625, -0.004517555236816406, -0.0042400360107421875, -0.003962516784667969, -0.00368499755859375, -0.0034074783325195312, -0.0031299591064453125, -0.0028524398803710938, -0.002574920654296875, -0.0022974014282226562, -0.0020198822021484375, -0.0017423629760742188, -0.00146484375, -0.0011873245239257812, -0.0009098052978515625, -0.0006322860717773438, -0.000354766845703125, -7.724761962890625e-05, 0.0002002716064453125, 0.00047779083251953125, 0.00075531005859375, 0.0010328292846679688, 0.0013103485107421875, 0.0015878677368164062, 0.001865386962890625, 0.0021429061889648438, 0.0024204254150390625, 0.0026979446411132812, 0.0029754638671875, 0.0032529830932617188, 0.0035305023193359375, 0.0038080215454101562, 0.004085540771484375, 0.004363059997558594, 0.0046405792236328125, 0.004918098449707031, 0.00519561767578125, 0.005473136901855469, 0.0057506561279296875, 0.006028175354003906, 0.006305694580078125, 0.006583213806152344, 0.0068607330322265625, 0.007138252258300781, 0.007415771484375, 0.007693290710449219, 0.007970809936523438, 0.008248329162597656, 0.008525848388671875, 0.008803367614746094, 0.009080886840820312, 0.009358406066894531, 0.00963592529296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 8.0, 10.0, 9.0, 8.0, 7.0, 9.0, 12.0, 17.0, 17.0, 24.0, 31.0, 26.0, 25.0, 31.0, 30.0, 32.0, 24.0, 38.0, 42.0, 44.0, 35.0, 41.0, 30.0, 35.0, 32.0, 27.0, 33.0, 34.0, 48.0, 28.0, 25.0, 29.0, 19.0, 18.0, 20.0, 17.0, 13.0, 14.0, 16.0, 6.0, 4.0, 11.0, 5.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.013580322265625, -0.013148903846740723, -0.012717485427856445, -0.012286067008972168, -0.01185464859008789, -0.011423230171203613, -0.010991811752319336, -0.010560393333435059, -0.010128974914550781, -0.009697556495666504, -0.009266138076782227, -0.00883471965789795, -0.008403301239013672, -0.007971882820129395, -0.007540464401245117, -0.00710904598236084, -0.0066776275634765625, -0.006246209144592285, -0.005814790725708008, -0.0053833723068237305, -0.004951953887939453, -0.004520535469055176, -0.0040891170501708984, -0.003657698631286621, -0.0032262802124023438, -0.0027948617935180664, -0.002363443374633789, -0.0019320249557495117, -0.0015006065368652344, -0.001069188117980957, -0.0006377696990966797, -0.00020635128021240234, 0.000225067138671875, 0.0006564855575561523, 0.0010879039764404297, 0.001519322395324707, 0.0019507408142089844, 0.0023821592330932617, 0.002813577651977539, 0.0032449960708618164, 0.0036764144897460938, 0.004107832908630371, 0.0045392513275146484, 0.004970669746398926, 0.005402088165283203, 0.0058335065841674805, 0.006264925003051758, 0.006696343421936035, 0.0071277618408203125, 0.00755918025970459, 0.007990598678588867, 0.008422017097473145, 0.008853435516357422, 0.0092848539352417, 0.009716272354125977, 0.010147690773010254, 0.010579109191894531, 0.011010527610778809, 0.011441946029663086, 0.011873364448547363, 0.01230478286743164, 0.012736201286315918, 0.013167619705200195, 0.013599038124084473, 0.01403045654296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 2.0, 6.0, 3.0, 7.0, 5.0, 17.0, 33.0, 37.0, 37.0, 66.0, 76.0, 114.0, 177.0, 248.0, 327.0, 510.0, 769.0, 1117.0, 1581.0, 2328.0, 3632.0, 5692.0, 9516.0, 18248.0, 41573.0, 129626.0, 509644.0, 209646.0, 59057.0, 23317.0, 11825.0, 6755.0, 4096.0, 2666.0, 1856.0, 1158.0, 861.0, 599.0, 414.0, 287.0, 166.0, 136.0, 96.0, 78.0, 46.0, 30.0, 31.0, 14.0, 11.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.01291656494140625, -0.012481212615966797, -0.012045860290527344, -0.01161050796508789, -0.011175155639648438, -0.010739803314208984, -0.010304450988769531, -0.009869098663330078, -0.009433746337890625, -0.008998394012451172, -0.008563041687011719, -0.008127689361572266, -0.0076923370361328125, -0.007256984710693359, -0.006821632385253906, -0.006386280059814453, -0.005950927734375, -0.005515575408935547, -0.005080223083496094, -0.004644870758056641, -0.0042095184326171875, -0.0037741661071777344, -0.0033388137817382812, -0.002903461456298828, -0.002468109130859375, -0.002032756805419922, -0.0015974044799804688, -0.0011620521545410156, -0.0007266998291015625, -0.0002913475036621094, 0.00014400482177734375, 0.0005793571472167969, 0.00101470947265625, 0.0014500617980957031, 0.0018854141235351562, 0.0023207664489746094, 0.0027561187744140625, 0.0031914710998535156, 0.0036268234252929688, 0.004062175750732422, 0.004497528076171875, 0.004932880401611328, 0.005368232727050781, 0.005803585052490234, 0.0062389373779296875, 0.006674289703369141, 0.007109642028808594, 0.007544994354248047, 0.0079803466796875, 0.008415699005126953, 0.008851051330566406, 0.00928640365600586, 0.009721755981445312, 0.010157108306884766, 0.010592460632324219, 0.011027812957763672, 0.011463165283203125, 0.011898517608642578, 0.012333869934082031, 0.012769222259521484, 0.013204574584960938, 0.01363992691040039, 0.014075279235839844, 0.014510631561279297, 0.01494598388671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 11.0, 11.0, 16.0, 14.0, 20.0, 24.0, 20.0, 29.0, 41.0, 27.0, 36.0, 31.0, 34.0, 54.0, 43.0, 43.0, 48.0, 45.0, 44.0, 44.0, 44.0, 37.0, 35.0, 29.0, 37.0, 34.0, 17.0, 20.0, 19.0, 23.0, 13.0, 15.0, 11.0, 7.0, 9.0, 7.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0123138427734375, -0.011976361274719238, -0.011638879776000977, -0.011301398277282715, -0.010963916778564453, -0.010626435279846191, -0.01028895378112793, -0.009951472282409668, -0.009613990783691406, -0.009276509284973145, -0.008939027786254883, -0.008601546287536621, -0.00826406478881836, -0.007926583290100098, -0.007589101791381836, -0.007251620292663574, -0.0069141387939453125, -0.006576657295227051, -0.006239175796508789, -0.005901694297790527, -0.005564212799072266, -0.005226731300354004, -0.004889249801635742, -0.0045517683029174805, -0.004214286804199219, -0.003876805305480957, -0.0035393238067626953, -0.0032018423080444336, -0.002864360809326172, -0.00252687931060791, -0.0021893978118896484, -0.0018519163131713867, -0.001514434814453125, -0.0011769533157348633, -0.0008394718170166016, -0.0005019903182983398, -0.00016450881958007812, 0.0001729726791381836, 0.0005104541778564453, 0.000847935676574707, 0.0011854171752929688, 0.0015228986740112305, 0.0018603801727294922, 0.002197861671447754, 0.0025353431701660156, 0.0028728246688842773, 0.003210306167602539, 0.0035477876663208008, 0.0038852691650390625, 0.004222750663757324, 0.004560232162475586, 0.004897713661193848, 0.005235195159912109, 0.005572676658630371, 0.005910158157348633, 0.0062476396560668945, 0.006585121154785156, 0.006922602653503418, 0.00726008415222168, 0.007597565650939941, 0.007935047149658203, 0.008272528648376465, 0.008610010147094727, 0.008947491645812988, 0.00928497314453125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 6.0, 8.0, 17.0, 11.0, 14.0, 24.0, 37.0, 33.0, 50.0, 70.0, 105.0, 165.0, 251.0, 390.0, 633.0, 1115.0, 2092.0, 4153.0, 8906.0, 24588.0, 98705.0, 710076.0, 144662.0, 31200.0, 10829.0, 4714.0, 2420.0, 1270.0, 702.0, 421.0, 273.0, 162.0, 122.0, 77.0, 51.0, 51.0, 32.0, 24.0, 25.0, 10.0, 12.0, 14.0, 5.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.001617431640625, -0.0015706866979599, -0.0015239417552947998, -0.0014771968126296997, -0.0014304518699645996, -0.0013837069272994995, -0.0013369619846343994, -0.0012902170419692993, -0.0012434720993041992, -0.0011967271566390991, -0.001149982213973999, -0.001103237271308899, -0.0010564923286437988, -0.0010097473859786987, -0.0009630024433135986, -0.0009162575006484985, -0.0008695125579833984, -0.0008227676153182983, -0.0007760226726531982, -0.0007292777299880981, -0.000682532787322998, -0.000635787844657898, -0.0005890429019927979, -0.0005422979593276978, -0.0004955530166625977, -0.00044880807399749756, -0.00040206313133239746, -0.00035531818866729736, -0.00030857324600219727, -0.00026182830333709717, -0.00021508336067199707, -0.00016833841800689697, -0.00012159347534179688, -7.484853267669678e-05, -2.810359001159668e-05, 1.8641352653503418e-05, 6.538629531860352e-05, 0.00011213123798370361, 0.0001588761806488037, 0.0002056211233139038, 0.0002523660659790039, 0.000299111008644104, 0.0003458559513092041, 0.0003926008939743042, 0.0004393458366394043, 0.0004860907793045044, 0.0005328357219696045, 0.0005795806646347046, 0.0006263256072998047, 0.0006730705499649048, 0.0007198154926300049, 0.000766560435295105, 0.0008133053779602051, 0.0008600503206253052, 0.0009067952632904053, 0.0009535402059555054, 0.0010002851486206055, 0.0010470300912857056, 0.0010937750339508057, 0.0011405199766159058, 0.0011872649192810059, 0.001234009861946106, 0.001280754804611206, 0.0013274997472763062, 0.0013742446899414062]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 0.0, 9.0, 11.0, 0.0, 16.0, 14.0, 0.0, 24.0, 26.0, 0.0, 42.0, 0.0, 41.0, 49.0, 0.0, 75.0, 75.0, 0.0, 76.0, 83.0, 0.0, 94.0, 56.0, 0.0, 61.0, 65.0, 0.0, 47.0, 42.0, 0.0, 21.0, 12.0, 0.0, 20.0, 14.0, 0.0, 8.0, 7.0, 0.0, 8.0, 5.0, 0.0, 3.0, 4.0], "bins": [-1.5497207641601562e-06, -1.5106052160263062e-06, -1.471489667892456e-06, -1.432374119758606e-06, -1.3932585716247559e-06, -1.3541430234909058e-06, -1.3150274753570557e-06, -1.2759119272232056e-06, -1.2367963790893555e-06, -1.1976808309555054e-06, -1.1585652828216553e-06, -1.1194497346878052e-06, -1.080334186553955e-06, -1.041218638420105e-06, -1.0021030902862549e-06, -9.629875421524048e-07, -9.238719940185547e-07, -8.847564458847046e-07, -8.456408977508545e-07, -8.065253496170044e-07, -7.674098014831543e-07, -7.282942533493042e-07, -6.891787052154541e-07, -6.50063157081604e-07, -6.109476089477539e-07, -5.718320608139038e-07, -5.327165126800537e-07, -4.936009645462036e-07, -4.544854164123535e-07, -4.153698682785034e-07, -3.762543201446533e-07, -3.371387720108032e-07, -2.980232238769531e-07, -2.5890767574310303e-07, -2.1979212760925293e-07, -1.8067657947540283e-07, -1.4156103134155273e-07, -1.0244548320770264e-07, -6.332993507385254e-08, -2.421438694000244e-08, 1.4901161193847656e-08, 5.4016709327697754e-08, 9.313225746154785e-08, 1.3224780559539795e-07, 1.7136335372924805e-07, 2.1047890186309814e-07, 2.4959444999694824e-07, 2.8870999813079834e-07, 3.2782554626464844e-07, 3.6694109439849854e-07, 4.0605664253234863e-07, 4.4517219066619873e-07, 4.842877388000488e-07, 5.234032869338989e-07, 5.62518835067749e-07, 6.016343832015991e-07, 6.407499313354492e-07, 6.798654794692993e-07, 7.189810276031494e-07, 7.580965757369995e-07, 7.972121238708496e-07, 8.363276720046997e-07, 8.754432201385498e-07, 9.145587682723999e-07, 9.5367431640625e-07]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 5.0, 10.0, 5.0, 14.0, 16.0, 17.0, 19.0, 28.0, 53.0, 69.0, 89.0, 151.0, 214.0, 264.0, 395.0, 651.0, 1074.0, 1946.0, 3999.0, 9373.0, 25666.0, 95797.0, 651342.0, 192148.0, 39982.0, 13538.0, 5513.0, 2497.0, 1331.0, 770.0, 494.0, 288.0, 221.0, 173.0, 114.0, 85.0, 39.0, 45.0, 29.0, 23.0, 13.0, 12.0, 16.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0020771026611328125, -0.002013564109802246, -0.0019500255584716797, -0.0018864870071411133, -0.0018229484558105469, -0.0017594099044799805, -0.001695871353149414, -0.0016323328018188477, -0.0015687942504882812, -0.0015052556991577148, -0.0014417171478271484, -0.001378178596496582, -0.0013146400451660156, -0.0012511014938354492, -0.0011875629425048828, -0.0011240243911743164, -0.00106048583984375, -0.0009969472885131836, -0.0009334087371826172, -0.0008698701858520508, -0.0008063316345214844, -0.000742793083190918, -0.0006792545318603516, -0.0006157159805297852, -0.0005521774291992188, -0.0004886388778686523, -0.00042510032653808594, -0.00036156177520751953, -0.0002980232238769531, -0.00023448467254638672, -0.0001709461212158203, -0.0001074075698852539, -4.38690185546875e-05, 1.9669532775878906e-05, 8.320808410644531e-05, 0.00014674663543701172, 0.00021028518676757812, 0.00027382373809814453, 0.00033736228942871094, 0.00040090084075927734, 0.00046443939208984375, 0.0005279779434204102, 0.0005915164947509766, 0.000655055046081543, 0.0007185935974121094, 0.0007821321487426758, 0.0008456707000732422, 0.0009092092514038086, 0.000972747802734375, 0.0010362863540649414, 0.0010998249053955078, 0.0011633634567260742, 0.0012269020080566406, 0.001290440559387207, 0.0013539791107177734, 0.0014175176620483398, 0.0014810562133789062, 0.0015445947647094727, 0.001608133316040039, 0.0016716718673706055, 0.0017352104187011719, 0.0017987489700317383, 0.0018622875213623047, 0.001925826072692871, 0.0019893646240234375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 10.0, 13.0, 25.0, 20.0, 36.0, 58.0, 109.0, 165.0, 212.0, 126.0, 81.0, 45.0, 25.0, 23.0, 9.0, 14.0, 6.0, 5.0, 3.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005159378051757812, -0.0004962682723999023, -0.00047659873962402344, -0.00045692920684814453, -0.0004372596740722656, -0.0004175901412963867, -0.0003979206085205078, -0.0003782510757446289, -0.00035858154296875, -0.0003389120101928711, -0.0003192424774169922, -0.0002995729446411133, -0.0002799034118652344, -0.00026023387908935547, -0.00024056434631347656, -0.00022089481353759766, -0.00020122528076171875, -0.00018155574798583984, -0.00016188621520996094, -0.00014221668243408203, -0.00012254714965820312, -0.00010287761688232422, -8.320808410644531e-05, -6.35385513305664e-05, -4.38690185546875e-05, -2.4199485778808594e-05, -4.5299530029296875e-06, 1.5139579772949219e-05, 3.4809112548828125e-05, 5.447864532470703e-05, 7.414817810058594e-05, 9.381771087646484e-05, 0.00011348724365234375, 0.00013315677642822266, 0.00015282630920410156, 0.00017249584197998047, 0.00019216537475585938, 0.00021183490753173828, 0.0002315044403076172, 0.0002511739730834961, 0.000270843505859375, 0.0002905130386352539, 0.0003101825714111328, 0.0003298521041870117, 0.0003495216369628906, 0.00036919116973876953, 0.00038886070251464844, 0.00040853023529052734, 0.00042819976806640625, 0.00044786930084228516, 0.00046753883361816406, 0.00048720836639404297, 0.0005068778991699219, 0.0005265474319458008, 0.0005462169647216797, 0.0005658864974975586, 0.0005855560302734375, 0.0006052255630493164, 0.0006248950958251953, 0.0006445646286010742, 0.0006642341613769531, 0.000683903694152832, 0.0007035732269287109, 0.0007232427597045898, 0.0007429122924804688]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 7.0, 10.0, 10.0, 18.0, 25.0, 25.0, 45.0, 46.0, 41.0, 72.0, 88.0, 110.0, 113.0, 74.0, 73.0, 44.0, 39.0, 38.0, 24.0, 29.0, 17.0, 10.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017681382596492767, -0.017001349478960037, -0.016321314498782158, -0.015641281381249428, -0.014961246401071548, -0.014281212352216244, -0.013601178303360939, -0.012921145185828209, -0.01224111020565033, -0.011561076156795025, -0.01088104210793972, -0.010201008059084415, -0.00952097401022911, -0.008840939961373806, -0.008160905912518501, -0.007480872329324484, -0.0068008387461304665, -0.006120804697275162, -0.005440770648419857, -0.004760736599564552, -0.004080702550709248, -0.0034006687346845865, -0.0027206349186599255, -0.0020406008698046207, -0.001360566820949316, -0.0006805328303016722, -4.988396540284157e-07, 0.0006795350927859545, 0.0013595691416412592, 0.002039603190496564, 0.002719637006521225, 0.0033996710553765297, 0.004079705104231834, 0.004759739153087139, 0.005439773201942444, 0.0061198072507977486, 0.006799841299653053, 0.007479875348508358, 0.008159909397363663, 0.008839942514896393, 0.009519977495074272, 0.010200011543929577, 0.010880045592784882, 0.011560079641640186, 0.012240113690495491, 0.012920147739350796, 0.0136001817882061, 0.01428021490573883, 0.014960248954594135, 0.01564028300344944, 0.01632031612098217, 0.01700035110116005, 0.01768038421869278, 0.01836041919887066, 0.01904045231640339, 0.01972048729658127, 0.020400520414114, 0.02108055353164673, 0.021760588511824608, 0.022440621629357338, 0.023120656609535217, 0.023800689727067947, 0.024480724707245827, 0.025160757824778557, 0.025840792804956436]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 9.0, 8.0, 6.0, 14.0, 10.0, 9.0, 19.0, 18.0, 20.0, 32.0, 34.0, 27.0, 27.0, 38.0, 43.0, 39.0, 51.0, 49.0, 32.0, 43.0, 35.0, 33.0, 28.0, 39.0, 33.0, 41.0, 45.0, 32.0, 23.0, 28.0, 21.0, 20.0, 15.0, 19.0, 16.0, 14.0, 6.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.015511558391153812, -0.015049237757921219, -0.014586917124688625, -0.014124596491456032, -0.013662276789546013, -0.01319995615631342, -0.012737635523080826, -0.012275314889848232, -0.011812994256615639, -0.011350673623383045, -0.010888352990150452, -0.010426033288240433, -0.00996371265500784, -0.009501392021775246, -0.009039071388542652, -0.008576750755310059, -0.00811443105340004, -0.007652110420167446, -0.00718979025259614, -0.006727469619363546, -0.00626514945179224, -0.005802828818559647, -0.005340508185327053, -0.0048781875520944595, -0.004415867384523153, -0.00395354675129056, -0.0034912265837192535, -0.00302890595048666, -0.00256658555008471, -0.0021042651496827602, -0.0016419445164501667, -0.0011796241160482168, -0.0007173037156462669, -0.00025498325703665614, 0.00020733720157295465, 0.0006696577183902264, 0.0011319781187921762, 0.0015942985191941261, 0.0020566191524267197, 0.0025189395528286695, 0.0029812599532306194, 0.0034435803536325693, 0.003905900754034519, 0.004368221387267113, 0.004830542020499706, 0.0052928621880710125, 0.005755182821303606, 0.006217502988874912, 0.006679823622107506, 0.007142144255340099, 0.0076044644229114056, 0.008066784590482712, 0.008529105223715305, 0.008991425856947899, 0.009453746490180492, 0.009916067123413086, 0.010378386825323105, 0.010840707458555698, 0.011303028091788292, 0.01176534779369831, 0.012227668426930904, 0.012689989060163498, 0.013152309693396091, 0.013614630326628685, 0.014076950959861279]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 7.0, 8.0, 13.0, 15.0, 26.0, 35.0, 48.0, 72.0, 98.0, 151.0, 188.0, 318.0, 429.0, 632.0, 918.0, 1331.0, 1782.0, 2643.0, 3787.0, 5409.0, 7921.0, 12305.0, 18501.0, 28654.0, 44218.0, 71949.0, 120409.0, 204558.0, 202939.0, 119573.0, 71122.0, 44276.0, 28051.0, 18228.0, 12137.0, 7967.0, 5550.0, 3797.0, 2504.0, 1827.0, 1277.0, 885.0, 598.0, 418.0, 312.0, 214.0, 146.0, 104.0, 57.0, 57.0, 25.0, 23.0, 19.0, 14.0, 10.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.02294921875, -0.022208690643310547, -0.021468162536621094, -0.02072763442993164, -0.019987106323242188, -0.019246578216552734, -0.01850605010986328, -0.017765522003173828, -0.017024993896484375, -0.016284465789794922, -0.015543937683105469, -0.014803409576416016, -0.014062881469726562, -0.01332235336303711, -0.012581825256347656, -0.011841297149658203, -0.01110076904296875, -0.010360240936279297, -0.009619712829589844, -0.00887918472290039, -0.008138656616210938, -0.007398128509521484, -0.006657600402832031, -0.005917072296142578, -0.005176544189453125, -0.004436016082763672, -0.0036954879760742188, -0.0029549598693847656, -0.0022144317626953125, -0.0014739036560058594, -0.0007333755493164062, 7.152557373046875e-06, 0.0007476806640625, 0.0014882087707519531, 0.0022287368774414062, 0.0029692649841308594, 0.0037097930908203125, 0.004450321197509766, 0.005190849304199219, 0.005931377410888672, 0.006671905517578125, 0.007412433624267578, 0.008152961730957031, 0.008893489837646484, 0.009634017944335938, 0.01037454605102539, 0.011115074157714844, 0.011855602264404297, 0.01259613037109375, 0.013336658477783203, 0.014077186584472656, 0.01481771469116211, 0.015558242797851562, 0.016298770904541016, 0.01703929901123047, 0.017779827117919922, 0.018520355224609375, 0.019260883331298828, 0.02000141143798828, 0.020741939544677734, 0.021482467651367188, 0.02222299575805664, 0.022963523864746094, 0.023704051971435547, 0.024444580078125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 10.0, 5.0, 9.0, 7.0, 16.0, 16.0, 21.0, 19.0, 26.0, 29.0, 33.0, 30.0, 42.0, 38.0, 49.0, 40.0, 46.0, 45.0, 38.0, 49.0, 35.0, 38.0, 40.0, 43.0, 41.0, 34.0, 30.0, 15.0, 27.0, 24.0, 12.0, 22.0, 16.0, 15.0, 9.0, 8.0, 12.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.01390838623046875, -0.013493061065673828, -0.013077735900878906, -0.012662410736083984, -0.012247085571289062, -0.01183176040649414, -0.011416435241699219, -0.011001110076904297, -0.010585784912109375, -0.010170459747314453, -0.009755134582519531, -0.00933980941772461, -0.008924484252929688, -0.008509159088134766, -0.008093833923339844, -0.007678508758544922, -0.00726318359375, -0.006847858428955078, -0.006432533264160156, -0.006017208099365234, -0.0056018829345703125, -0.005186557769775391, -0.004771232604980469, -0.004355907440185547, -0.003940582275390625, -0.003525257110595703, -0.0031099319458007812, -0.0026946067810058594, -0.0022792816162109375, -0.0018639564514160156, -0.0014486312866210938, -0.0010333061218261719, -0.00061798095703125, -0.00020265579223632812, 0.00021266937255859375, 0.0006279945373535156, 0.0010433197021484375, 0.0014586448669433594, 0.0018739700317382812, 0.002289295196533203, 0.002704620361328125, 0.003119945526123047, 0.0035352706909179688, 0.003950595855712891, 0.0043659210205078125, 0.004781246185302734, 0.005196571350097656, 0.005611896514892578, 0.0060272216796875, 0.006442546844482422, 0.006857872009277344, 0.007273197174072266, 0.0076885223388671875, 0.00810384750366211, 0.008519172668457031, 0.008934497833251953, 0.009349822998046875, 0.009765148162841797, 0.010180473327636719, 0.01059579849243164, 0.011011123657226562, 0.011426448822021484, 0.011841773986816406, 0.012257099151611328, 0.01267242431640625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 14.0, 12.0, 26.0, 49.0, 55.0, 91.0, 134.0, 222.0, 357.0, 643.0, 1088.0, 1912.0, 3101.0, 5106.0, 8784.0, 14741.0, 25598.0, 44153.0, 78832.0, 149424.0, 287939.0, 195832.0, 99438.0, 55194.0, 31142.0, 18512.0, 10793.0, 6111.0, 3775.0, 2151.0, 1308.0, 751.0, 467.0, 305.0, 183.0, 105.0, 69.0, 55.0, 28.0, 19.0, 12.0, 7.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.031585693359375, -0.030675172805786133, -0.029764652252197266, -0.0288541316986084, -0.02794361114501953, -0.027033090591430664, -0.026122570037841797, -0.02521204948425293, -0.024301528930664062, -0.023391008377075195, -0.022480487823486328, -0.02156996726989746, -0.020659446716308594, -0.019748926162719727, -0.01883840560913086, -0.017927885055541992, -0.017017364501953125, -0.016106843948364258, -0.01519632339477539, -0.014285802841186523, -0.013375282287597656, -0.012464761734008789, -0.011554241180419922, -0.010643720626831055, -0.009733200073242188, -0.00882267951965332, -0.007912158966064453, -0.007001638412475586, -0.006091117858886719, -0.0051805973052978516, -0.004270076751708984, -0.003359556198120117, -0.00244903564453125, -0.0015385150909423828, -0.0006279945373535156, 0.00028252601623535156, 0.0011930465698242188, 0.002103567123413086, 0.003014087677001953, 0.00392460823059082, 0.0048351287841796875, 0.005745649337768555, 0.006656169891357422, 0.007566690444946289, 0.008477210998535156, 0.009387731552124023, 0.01029825210571289, 0.011208772659301758, 0.012119293212890625, 0.013029813766479492, 0.01394033432006836, 0.014850854873657227, 0.015761375427246094, 0.01667189598083496, 0.017582416534423828, 0.018492937088012695, 0.019403457641601562, 0.02031397819519043, 0.021224498748779297, 0.022135019302368164, 0.02304553985595703, 0.0239560604095459, 0.024866580963134766, 0.025777101516723633, 0.0266876220703125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 3.0, 7.0, 6.0, 7.0, 15.0, 11.0, 13.0, 16.0, 20.0, 16.0, 16.0, 23.0, 21.0, 19.0, 24.0, 20.0, 18.0, 23.0, 38.0, 44.0, 28.0, 35.0, 34.0, 39.0, 33.0, 26.0, 36.0, 27.0, 32.0, 42.0, 25.0, 27.0, 27.0, 26.0, 25.0, 16.0, 28.0, 22.0, 16.0, 11.0, 9.0, 9.0, 13.0, 8.0, 9.0, 6.0, 9.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.006793975830078125, -0.006586551666259766, -0.006379127502441406, -0.006171703338623047, -0.0059642791748046875, -0.005756855010986328, -0.005549430847167969, -0.005342006683349609, -0.00513458251953125, -0.004927158355712891, -0.004719734191894531, -0.004512310028076172, -0.0043048858642578125, -0.004097461700439453, -0.0038900375366210938, -0.0036826133728027344, -0.003475189208984375, -0.0032677650451660156, -0.0030603408813476562, -0.002852916717529297, -0.0026454925537109375, -0.002438068389892578, -0.0022306442260742188, -0.0020232200622558594, -0.0018157958984375, -0.0016083717346191406, -0.0014009475708007812, -0.0011935234069824219, -0.0009860992431640625, -0.0007786750793457031, -0.0005712509155273438, -0.0003638267517089844, -0.000156402587890625, 5.1021575927734375e-05, 0.00025844573974609375, 0.0004658699035644531, 0.0006732940673828125, 0.0008807182312011719, 0.0010881423950195312, 0.0012955665588378906, 0.00150299072265625, 0.0017104148864746094, 0.0019178390502929688, 0.002125263214111328, 0.0023326873779296875, 0.002540111541748047, 0.0027475357055664062, 0.0029549598693847656, 0.003162384033203125, 0.0033698081970214844, 0.0035772323608398438, 0.003784656524658203, 0.0039920806884765625, 0.004199504852294922, 0.004406929016113281, 0.004614353179931641, 0.00482177734375, 0.005029201507568359, 0.005236625671386719, 0.005444049835205078, 0.0056514739990234375, 0.005858898162841797, 0.006066322326660156, 0.006273746490478516, 0.006481170654296875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 19.0, 9.0, 24.0, 51.0, 60.0, 73.0, 147.0, 186.0, 260.0, 379.0, 503.0, 671.0, 968.0, 1297.0, 1900.0, 2770.0, 4142.0, 6464.0, 11130.0, 21233.0, 60828.0, 687985.0, 172776.0, 34436.0, 15031.0, 8533.0, 5289.0, 3484.0, 2430.0, 1594.0, 1135.0, 749.0, 536.0, 384.0, 292.0, 231.0, 160.0, 105.0, 85.0, 47.0, 35.0, 37.0, 27.0, 13.0, 15.0, 7.0, 6.0, 2.0, 3.0, 2.0], "bins": [-0.0017576217651367188, -0.0017084777355194092, -0.0016593337059020996, -0.00161018967628479, -0.0015610456466674805, -0.001511901617050171, -0.0014627575874328613, -0.0014136135578155518, -0.0013644695281982422, -0.0013153254985809326, -0.001266181468963623, -0.0012170374393463135, -0.001167893409729004, -0.0011187493801116943, -0.0010696053504943848, -0.0010204613208770752, -0.0009713172912597656, -0.0009221732616424561, -0.0008730292320251465, -0.0008238852024078369, -0.0007747411727905273, -0.0007255971431732178, -0.0006764531135559082, -0.0006273090839385986, -0.0005781650543212891, -0.0005290210247039795, -0.0004798769950866699, -0.00043073296546936035, -0.0003815889358520508, -0.0003324449062347412, -0.00028330087661743164, -0.00023415684700012207, -0.0001850128173828125, -0.00013586878776550293, -8.672475814819336e-05, -3.758072853088379e-05, 1.1563301086425781e-05, 6.070733070373535e-05, 0.00010985136032104492, 0.0001589953899383545, 0.00020813941955566406, 0.00025728344917297363, 0.0003064274787902832, 0.0003555715084075928, 0.00040471553802490234, 0.0004538595676422119, 0.0005030035972595215, 0.0005521476268768311, 0.0006012916564941406, 0.0006504356861114502, 0.0006995797157287598, 0.0007487237453460693, 0.0007978677749633789, 0.0008470118045806885, 0.000896155834197998, 0.0009452998638153076, 0.0009944438934326172, 0.0010435879230499268, 0.0010927319526672363, 0.001141875982284546, 0.0011910200119018555, 0.001240164041519165, 0.0012893080711364746, 0.0013384521007537842, 0.0013875961303710938]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 5.0, 0.0, 12.0, 0.0, 23.0, 0.0, 39.0, 0.0, 57.0, 0.0, 0.0, 104.0, 0.0, 149.0, 0.0, 190.0, 0.0, 177.0, 0.0, 115.0, 0.0, 0.0, 64.0, 0.0, 25.0, 0.0, 21.0, 0.0, 6.0, 0.0, 1.0, 0.0, 0.0, 8.0, 0.0, 5.0, 0.0, 3.0, 0.0, 5.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.882473826408386e-07, -6.612390279769897e-07, -6.342306733131409e-07, -6.07222318649292e-07, -5.802139639854431e-07, -5.532056093215942e-07, -5.261972546577454e-07, -4.991888999938965e-07, -4.721805453300476e-07, -4.4517219066619873e-07, -4.1816383600234985e-07, -3.91155481338501e-07, -3.641471266746521e-07, -3.371387720108032e-07, -3.1013041734695435e-07, -2.8312206268310547e-07, -2.561137080192566e-07, -2.2910535335540771e-07, -2.0209699869155884e-07, -1.7508864402770996e-07, -1.4808028936386108e-07, -1.210719347000122e-07, -9.406358003616333e-08, -6.705522537231445e-08, -4.0046870708465576e-08, -1.30385160446167e-08, 1.3969838619232178e-08, 4.0978193283081055e-08, 6.798654794692993e-08, 9.499490261077881e-08, 1.2200325727462769e-07, 1.4901161193847656e-07, 1.7601996660232544e-07, 2.0302832126617432e-07, 2.300366759300232e-07, 2.5704503059387207e-07, 2.8405338525772095e-07, 3.110617399215698e-07, 3.380700945854187e-07, 3.650784492492676e-07, 3.9208680391311646e-07, 4.1909515857696533e-07, 4.461035132408142e-07, 4.731118679046631e-07, 5.00120222568512e-07, 5.271285772323608e-07, 5.541369318962097e-07, 5.811452865600586e-07, 6.081536412239075e-07, 6.351619958877563e-07, 6.621703505516052e-07, 6.891787052154541e-07, 7.16187059879303e-07, 7.431954145431519e-07, 7.702037692070007e-07, 7.972121238708496e-07, 8.242204785346985e-07, 8.512288331985474e-07, 8.782371878623962e-07, 9.052455425262451e-07, 9.32253897190094e-07, 9.592622518539429e-07, 9.862706065177917e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 12.0, 16.0, 23.0, 19.0, 34.0, 32.0, 58.0, 78.0, 117.0, 176.0, 208.0, 368.0, 546.0, 826.0, 1276.0, 2081.0, 3378.0, 5769.0, 10627.0, 23306.0, 102137.0, 794773.0, 61442.0, 18898.0, 8976.0, 5064.0, 3002.0, 1863.0, 1181.0, 744.0, 479.0, 317.0, 201.0, 147.0, 105.0, 69.0, 52.0, 39.0, 25.0, 27.0, 20.0, 9.0, 8.0, 10.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0020351409912109375, -0.001972287893295288, -0.0019094347953796387, -0.0018465816974639893, -0.0017837285995483398, -0.0017208755016326904, -0.001658022403717041, -0.0015951693058013916, -0.0015323162078857422, -0.0014694631099700928, -0.0014066100120544434, -0.001343756914138794, -0.0012809038162231445, -0.0012180507183074951, -0.0011551976203918457, -0.0010923445224761963, -0.0010294914245605469, -0.0009666383266448975, -0.000903785228729248, -0.0008409321308135986, -0.0007780790328979492, -0.0007152259349822998, -0.0006523728370666504, -0.000589519739151001, -0.0005266666412353516, -0.00046381354331970215, -0.00040096044540405273, -0.0003381073474884033, -0.0002752542495727539, -0.0002124011516571045, -0.00014954805374145508, -8.669495582580566e-05, -2.384185791015625e-05, 3.9011240005493164e-05, 0.00010186433792114258, 0.000164717435836792, 0.0002275705337524414, 0.0002904236316680908, 0.00035327672958374023, 0.00041612982749938965, 0.00047898292541503906, 0.0005418360233306885, 0.0006046891212463379, 0.0006675422191619873, 0.0007303953170776367, 0.0007932484149932861, 0.0008561015129089355, 0.000918954610824585, 0.0009818077087402344, 0.0010446608066558838, 0.0011075139045715332, 0.0011703670024871826, 0.001233220100402832, 0.0012960731983184814, 0.0013589262962341309, 0.0014217793941497803, 0.0014846324920654297, 0.001547485589981079, 0.0016103386878967285, 0.001673191785812378, 0.0017360448837280273, 0.0017988979816436768, 0.0018617510795593262, 0.0019246041774749756, 0.001987457275390625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 4.0, 6.0, 5.0, 9.0, 19.0, 15.0, 31.0, 66.0, 209.0, 339.0, 126.0, 58.0, 24.0, 14.0, 14.0, 7.0, 7.0, 12.0, 4.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006184577941894531, -0.0005993545055389404, -0.0005802512168884277, -0.000561147928237915, -0.0005420446395874023, -0.0005229413509368896, -0.000503838062286377, -0.00048473477363586426, -0.00046563148498535156, -0.00044652819633483887, -0.00042742490768432617, -0.0004083216190338135, -0.0003892183303833008, -0.0003701150417327881, -0.0003510117530822754, -0.0003319084644317627, -0.00031280517578125, -0.0002937018871307373, -0.0002745985984802246, -0.0002554953098297119, -0.00023639202117919922, -0.00021728873252868652, -0.00019818544387817383, -0.00017908215522766113, -0.00015997886657714844, -0.00014087557792663574, -0.00012177228927612305, -0.00010266900062561035, -8.356571197509766e-05, -6.446242332458496e-05, -4.5359134674072266e-05, -2.625584602355957e-05, -7.152557373046875e-06, 1.195073127746582e-05, 3.1054019927978516e-05, 5.015730857849121e-05, 6.92605972290039e-05, 8.83638858795166e-05, 0.0001074671745300293, 0.000126570463180542, 0.0001456737518310547, 0.00016477704048156738, 0.00018388032913208008, 0.00020298361778259277, 0.00022208690643310547, 0.00024119019508361816, 0.00026029348373413086, 0.00027939677238464355, 0.00029850006103515625, 0.00031760334968566895, 0.00033670663833618164, 0.00035580992698669434, 0.00037491321563720703, 0.0003940165042877197, 0.0004131197929382324, 0.0004322230815887451, 0.0004513263702392578, 0.0004704296588897705, 0.0004895329475402832, 0.0005086362361907959, 0.0005277395248413086, 0.0005468428134918213, 0.000565946102142334, 0.0005850493907928467, 0.0006041526794433594]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 5.0, 8.0, 5.0, 12.0, 17.0, 21.0, 20.0, 33.0, 36.0, 53.0, 69.0, 87.0, 106.0, 107.0, 81.0, 78.0, 53.0, 40.0, 41.0, 35.0, 28.0, 15.0, 6.0, 5.0, 10.0, 7.0, 3.0, 3.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01572066731750965, -0.015124631114304066, -0.01452859491109848, -0.01393255963921547, -0.013336523436009884, -0.012740487232804298, -0.012144451960921288, -0.011548415757715702, -0.010952379554510117, -0.010356343351304531, -0.009760307148098946, -0.009164271876215935, -0.00856823567301035, -0.007972199469804764, -0.007376163732260466, -0.0067801279947161674, -0.006184091791510582, -0.0055880555883049965, -0.004992019850760698, -0.0043959841132164, -0.0037999479100108147, -0.003203911939635873, -0.002607875969260931, -0.002011840231716633, -0.0014158040285110474, -0.0008197680581361055, -0.0002237320877611637, 0.0003723038826137781, 0.0009683398529887199, 0.0015643758233636618, 0.0021604117937386036, 0.0027564475312829018, 0.0033524837344884872, 0.003948519937694073, 0.004544555675238371, 0.005140591412782669, 0.0057366276159882545, 0.00633266381919384, 0.006928699556738138, 0.007524735294282436, 0.008120771497488022, 0.008716807700693607, 0.009312843903899193, 0.009908879175782204, 0.01050491537898779, 0.011100951582193375, 0.011696986854076385, 0.012293023057281971, 0.012889059260487556, 0.013485095463693142, 0.014081131666898727, 0.014677166938781738, 0.015273203141987324, 0.01586923934519291, 0.01646527461707592, 0.01706131175160408, 0.01765734702348709, 0.018253382295370102, 0.018849419429898262, 0.019445454701781273, 0.020041491836309433, 0.020637527108192444, 0.021233562380075455, 0.021829597651958466, 0.022425634786486626]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 1.0, 8.0, 8.0, 16.0, 11.0, 13.0, 15.0, 15.0, 26.0, 21.0, 21.0, 39.0, 35.0, 43.0, 30.0, 42.0, 28.0, 30.0, 47.0, 51.0, 45.0, 39.0, 40.0, 23.0, 46.0, 37.0, 40.0, 32.0, 29.0, 27.0, 18.0, 17.0, 17.0, 14.0, 15.0, 15.0, 7.0, 10.0, 7.0, 5.0, 2.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.014121543616056442, -0.013714209198951721, -0.013306875713169575, -0.012899541296064854, -0.012492206878960133, -0.012084873393177986, -0.011677538976073265, -0.011270204558968544, -0.010862870141863823, -0.010455535724759102, -0.010048202238976955, -0.009640867821872234, -0.009233533404767513, -0.008826199918985367, -0.008418865501880646, -0.008011531084775925, -0.007604197598993778, -0.0071968636475503445, -0.006789529230445623, -0.00638219527900219, -0.005974860861897469, -0.005567526910454035, -0.005160192959010601, -0.00475285854190588, -0.004345524590462446, -0.0039381906390190125, -0.0035308562219142914, -0.0031235222704708576, -0.00271618808619678, -0.002308853901922703, -0.001901519950479269, -0.0014941857662051916, -0.0010868506506085396, -0.0006795165245421231, -0.0002721823984757066, 0.000135151669383049, 0.0005424858536571264, 0.0009498200379312038, 0.0013571539893746376, 0.001764488173648715, 0.0021718223579227924, 0.00257915654219687, 0.0029864907264709473, 0.003393824677914381, 0.0038011588621884584, 0.004208493046462536, 0.00461582699790597, 0.005023160949349403, 0.0054304953664541245, 0.005837829317897558, 0.006245163735002279, 0.006652497686445713, 0.007059832103550434, 0.007467166054993868, 0.007874500006437302, 0.008281834423542023, 0.008689168840646744, 0.009096503257751465, 0.009503836743533611, 0.009911171160638332, 0.010318505577743053, 0.0107258390635252, 0.011133173480629921, 0.011540507897734642, 0.011947841383516788]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 6.0, 16.0, 15.0, 26.0, 31.0, 64.0, 68.0, 115.0, 138.0, 187.0, 271.0, 398.0, 580.0, 831.0, 1223.0, 1765.0, 2681.0, 4016.0, 6186.0, 9512.0, 14634.0, 23201.0, 37757.0, 62045.0, 107964.0, 207517.0, 561055.0, 1644125.0, 901595.0, 279423.0, 132655.0, 73760.0, 43843.0, 27060.0, 17271.0, 10913.0, 7073.0, 4739.0, 3104.0, 2110.0, 1403.0, 928.0, 628.0, 419.0, 278.0, 180.0, 136.0, 85.0, 65.0, 47.0, 30.0, 39.0, 18.0, 17.0, 18.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0], "bins": [-0.0147552490234375, -0.014274358749389648, -0.013793468475341797, -0.013312578201293945, -0.012831687927246094, -0.012350797653198242, -0.01186990737915039, -0.011389017105102539, -0.010908126831054688, -0.010427236557006836, -0.009946346282958984, -0.009465456008911133, -0.008984565734863281, -0.00850367546081543, -0.008022785186767578, -0.0075418949127197266, -0.007061004638671875, -0.0065801143646240234, -0.006099224090576172, -0.00561833381652832, -0.005137443542480469, -0.004656553268432617, -0.004175662994384766, -0.003694772720336914, -0.0032138824462890625, -0.002732992172241211, -0.0022521018981933594, -0.0017712116241455078, -0.0012903213500976562, -0.0008094310760498047, -0.0003285408020019531, 0.00015234947204589844, 0.00063323974609375, 0.0011141300201416016, 0.0015950202941894531, 0.0020759105682373047, 0.0025568008422851562, 0.003037691116333008, 0.0035185813903808594, 0.003999471664428711, 0.0044803619384765625, 0.004961252212524414, 0.005442142486572266, 0.005923032760620117, 0.006403923034667969, 0.00688481330871582, 0.007365703582763672, 0.007846593856811523, 0.008327484130859375, 0.008808374404907227, 0.009289264678955078, 0.00977015495300293, 0.010251045227050781, 0.010731935501098633, 0.011212825775146484, 0.011693716049194336, 0.012174606323242188, 0.012655496597290039, 0.01313638687133789, 0.013617277145385742, 0.014098167419433594, 0.014579057693481445, 0.015059947967529297, 0.015540838241577148, 0.016021728515625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 5.0, 4.0, 9.0, 12.0, 16.0, 11.0, 22.0, 16.0, 15.0, 13.0, 29.0, 27.0, 38.0, 40.0, 46.0, 45.0, 32.0, 27.0, 39.0, 49.0, 57.0, 48.0, 44.0, 31.0, 31.0, 40.0, 44.0, 32.0, 29.0, 21.0, 21.0, 16.0, 16.0, 13.0, 9.0, 11.0, 10.0, 8.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0084228515625, -0.008180797100067139, -0.007938742637634277, -0.007696688175201416, -0.007454633712768555, -0.007212579250335693, -0.006970524787902832, -0.006728470325469971, -0.006486415863037109, -0.006244361400604248, -0.006002306938171387, -0.005760252475738525, -0.005518198013305664, -0.005276143550872803, -0.005034089088439941, -0.00479203462600708, -0.004549980163574219, -0.004307925701141357, -0.004065871238708496, -0.0038238167762756348, -0.0035817623138427734, -0.003339707851409912, -0.0030976533889770508, -0.0028555989265441895, -0.002613544464111328, -0.002371490001678467, -0.0021294355392456055, -0.0018873810768127441, -0.0016453266143798828, -0.0014032721519470215, -0.0011612176895141602, -0.0009191632270812988, -0.0006771087646484375, -0.00043505430221557617, -0.00019299983978271484, 4.9054622650146484e-05, 0.0002911090850830078, 0.0005331635475158691, 0.0007752180099487305, 0.0010172724723815918, 0.0012593269348144531, 0.0015013813972473145, 0.0017434358596801758, 0.001985490322113037, 0.0022275447845458984, 0.0024695992469787598, 0.002711653709411621, 0.0029537081718444824, 0.0031957626342773438, 0.003437817096710205, 0.0036798715591430664, 0.003921926021575928, 0.004163980484008789, 0.00440603494644165, 0.004648089408874512, 0.004890143871307373, 0.005132198333740234, 0.005374252796173096, 0.005616307258605957, 0.005858361721038818, 0.00610041618347168, 0.006342470645904541, 0.006584525108337402, 0.006826579570770264, 0.007068634033203125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 12.0, 9.0, 15.0, 16.0, 26.0, 53.0, 56.0, 95.0, 150.0, 199.0, 317.0, 504.0, 706.0, 1110.0, 1761.0, 2662.0, 4024.0, 6326.0, 10438.0, 16496.0, 27701.0, 47139.0, 83795.0, 153349.0, 305152.0, 711940.0, 1490996.0, 684282.0, 296547.0, 149671.0, 81301.0, 46338.0, 27378.0, 16150.0, 9971.0, 6225.0, 3952.0, 2528.0, 1624.0, 1071.0, 722.0, 485.0, 333.0, 216.0, 150.0, 94.0, 65.0, 43.0, 26.0, 22.0, 16.0, 12.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0], "bins": [-0.01241302490234375, -0.012030839920043945, -0.01164865493774414, -0.011266469955444336, -0.010884284973144531, -0.010502099990844727, -0.010119915008544922, -0.009737730026245117, -0.009355545043945312, -0.008973360061645508, -0.008591175079345703, -0.008208990097045898, -0.007826805114746094, -0.007444620132446289, -0.007062435150146484, -0.00668025016784668, -0.006298065185546875, -0.00591588020324707, -0.005533695220947266, -0.005151510238647461, -0.004769325256347656, -0.0043871402740478516, -0.004004955291748047, -0.003622770309448242, -0.0032405853271484375, -0.002858400344848633, -0.002476215362548828, -0.0020940303802490234, -0.0017118453979492188, -0.001329660415649414, -0.0009474754333496094, -0.0005652904510498047, -0.00018310546875, 0.0001990795135498047, 0.0005812644958496094, 0.0009634494781494141, 0.0013456344604492188, 0.0017278194427490234, 0.002110004425048828, 0.002492189407348633, 0.0028743743896484375, 0.003256559371948242, 0.003638744354248047, 0.0040209293365478516, 0.004403114318847656, 0.004785299301147461, 0.005167484283447266, 0.00554966926574707, 0.005931854248046875, 0.00631403923034668, 0.006696224212646484, 0.007078409194946289, 0.007460594177246094, 0.007842779159545898, 0.008224964141845703, 0.008607149124145508, 0.008989334106445312, 0.009371519088745117, 0.009753704071044922, 0.010135889053344727, 0.010518074035644531, 0.010900259017944336, 0.01128244400024414, 0.011664628982543945, 0.01204681396484375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 8.0, 16.0, 15.0, 9.0, 14.0, 25.0, 29.0, 31.0, 37.0, 65.0, 65.0, 91.0, 120.0, 114.0, 144.0, 154.0, 178.0, 248.0, 275.0, 338.0, 321.0, 269.0, 236.0, 219.0, 202.0, 142.0, 130.0, 116.0, 84.0, 83.0, 59.0, 60.0, 34.0, 38.0, 23.0, 29.0, 6.0, 10.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0042572021484375, -0.004128575325012207, -0.003999948501586914, -0.003871321678161621, -0.003742694854736328, -0.003614068031311035, -0.003485441207885742, -0.0033568143844604492, -0.0032281875610351562, -0.0030995607376098633, -0.0029709339141845703, -0.0028423070907592773, -0.0027136802673339844, -0.0025850534439086914, -0.0024564266204833984, -0.0023277997970581055, -0.0021991729736328125, -0.0020705461502075195, -0.0019419193267822266, -0.0018132925033569336, -0.0016846656799316406, -0.0015560388565063477, -0.0014274120330810547, -0.0012987852096557617, -0.0011701583862304688, -0.0010415315628051758, -0.0009129047393798828, -0.0007842779159545898, -0.0006556510925292969, -0.0005270242691040039, -0.00039839744567871094, -0.00026977062225341797, -0.000141143798828125, -1.2516975402832031e-05, 0.00011610984802246094, 0.0002447366714477539, 0.0003733634948730469, 0.0005019903182983398, 0.0006306171417236328, 0.0007592439651489258, 0.0008878707885742188, 0.0010164976119995117, 0.0011451244354248047, 0.0012737512588500977, 0.0014023780822753906, 0.0015310049057006836, 0.0016596317291259766, 0.0017882585525512695, 0.0019168853759765625, 0.0020455121994018555, 0.0021741390228271484, 0.0023027658462524414, 0.0024313926696777344, 0.0025600194931030273, 0.0026886463165283203, 0.0028172731399536133, 0.0029458999633789062, 0.0030745267868041992, 0.003203153610229492, 0.003331780433654785, 0.003460407257080078, 0.003589034080505371, 0.003717660903930664, 0.003846287727355957, 0.00397491455078125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 10.0, 8.0, 5.0, 11.0, 10.0, 20.0, 21.0, 26.0, 34.0, 39.0, 29.0, 48.0, 75.0, 85.0, 101.0, 83.0, 70.0, 58.0, 48.0, 40.0, 33.0, 27.0, 15.0, 10.0, 13.0, 15.0, 13.0, 7.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010031668469309807, -0.009713997133076191, -0.00939632672816515, -0.009078655391931534, -0.008760984055697918, -0.008443312719464302, -0.00812564231455326, -0.007807970978319645, -0.007490299642086029, -0.0071726287715137005, -0.006854957435280085, -0.006537286564707756, -0.00621961522847414, -0.005901944357901812, -0.005584273487329483, -0.005266602151095867, -0.004948931280523539, -0.00463126040995121, -0.004313589073717594, -0.003995918203145266, -0.0036782468669116497, -0.003360575996339321, -0.003042904892936349, -0.0027252337895333767, -0.0024075626861304045, -0.0020898915827274323, -0.00177222047932446, -0.0014545494923368096, -0.0011368783889338374, -0.0008192072855308652, -0.0005015362985432148, -0.00018386519514024258, 0.00013380590826272964, 0.0004514769825618714, 0.0007691480568610132, 0.0010868191020563245, 0.0014044902054592967, 0.001722161308862269, 0.0020398322958499193, 0.0023575033992528915, 0.0026751745026558638, 0.002992845606058836, 0.003310516709461808, 0.0036281878128647804, 0.003945858683437109, 0.004263530019670725, 0.0045812008902430534, 0.004898872226476669, 0.005216543097048998, 0.0055342139676213264, 0.005851885303854942, 0.006169556174427271, 0.006487227510660887, 0.006804898381233215, 0.007122569717466831, 0.00744024058803916, 0.007757911458611488, 0.008075582794845104, 0.008393253199756145, 0.008710924535989761, 0.009028595872223377, 0.009346267208456993, 0.009663937613368034, 0.00998160894960165, 0.010299280285835266]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 12.0, 6.0, 8.0, 16.0, 10.0, 8.0, 23.0, 23.0, 22.0, 28.0, 30.0, 28.0, 41.0, 35.0, 38.0, 42.0, 49.0, 45.0, 40.0, 39.0, 39.0, 49.0, 45.0, 42.0, 36.0, 30.0, 22.0, 25.0, 26.0, 17.0, 17.0, 22.0, 20.0, 14.0, 13.0, 10.0, 10.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.007902451790869236, -0.007644967176020145, -0.007387482561171055, -0.007129997480660677, -0.006872512865811586, -0.006615028250962496, -0.006357543170452118, -0.006100058555603027, -0.005842573940753937, -0.005585089325904846, -0.005327604711055756, -0.005070119630545378, -0.004812635015696287, -0.004555150400847197, -0.004297665320336819, -0.004040180705487728, -0.0037826960906386375, -0.003525211475789547, -0.0032677266281098127, -0.0030102417804300785, -0.002752757165580988, -0.0024952725507318974, -0.002237787703052163, -0.001980302855372429, -0.0017228182405233383, -0.001465333509258926, -0.0012078487779945135, -0.0009503640467301011, -0.0006928793154656887, -0.0004353945842012763, -0.0001779098529368639, 7.95748783275485e-05, 0.0003370605409145355, 0.0005945452721789479, 0.0008520300034433603, 0.0011095147347077727, 0.0013669994659721851, 0.0016244841972365975, 0.00188196892850101, 0.002139453776180744, 0.0023969383910298347, 0.0026544230058789253, 0.0029119078535586596, 0.003169392701238394, 0.0034268773160874844, 0.003684361930936575, 0.003941847011446953, 0.004199331626296043, 0.004456816241145134, 0.0047143008559942245, 0.004971785470843315, 0.005229270551353693, 0.005486755166202784, 0.005744239781051874, 0.006001724861562252, 0.006259209476411343, 0.006516694091260433, 0.006774178706109524, 0.007031663320958614, 0.007289148401468992, 0.007546633016318083, 0.007804117631167173, 0.008061602711677551, 0.008319087326526642, 0.008576571941375732]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 7.0, 5.0, 17.0, 14.0, 23.0, 22.0, 33.0, 50.0, 84.0, 128.0, 167.0, 259.0, 359.0, 577.0, 888.0, 1436.0, 2246.0, 3549.0, 5985.0, 9950.0, 17608.0, 32589.0, 64704.0, 150148.0, 342849.0, 225694.0, 90672.0, 43356.0, 22969.0, 12619.0, 7283.0, 4476.0, 2777.0, 1749.0, 1138.0, 701.0, 485.0, 298.0, 222.0, 133.0, 100.0, 62.0, 39.0, 32.0, 18.0, 12.0, 8.0, 7.0, 4.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0057525634765625, -0.005571186542510986, -0.005389809608459473, -0.005208432674407959, -0.005027055740356445, -0.004845678806304932, -0.004664301872253418, -0.004482924938201904, -0.004301548004150391, -0.004120171070098877, -0.003938794136047363, -0.0037574172019958496, -0.003576040267944336, -0.0033946633338928223, -0.0032132863998413086, -0.003031909465789795, -0.0028505325317382812, -0.0026691555976867676, -0.002487778663635254, -0.0023064017295837402, -0.0021250247955322266, -0.0019436478614807129, -0.0017622709274291992, -0.0015808939933776855, -0.0013995170593261719, -0.0012181401252746582, -0.0010367631912231445, -0.0008553862571716309, -0.0006740093231201172, -0.0004926323890686035, -0.00031125545501708984, -0.00012987852096557617, 5.14984130859375e-05, 0.00023287534713745117, 0.00041425228118896484, 0.0005956292152404785, 0.0007770061492919922, 0.0009583830833435059, 0.0011397600173950195, 0.0013211369514465332, 0.0015025138854980469, 0.0016838908195495605, 0.0018652677536010742, 0.002046644687652588, 0.0022280216217041016, 0.0024093985557556152, 0.002590775489807129, 0.0027721524238586426, 0.0029535293579101562, 0.00313490629196167, 0.0033162832260131836, 0.0034976601600646973, 0.003679037094116211, 0.0038604140281677246, 0.004041790962219238, 0.004223167896270752, 0.004404544830322266, 0.004585921764373779, 0.004767298698425293, 0.004948675632476807, 0.00513005256652832, 0.005311429500579834, 0.005492806434631348, 0.005674183368682861, 0.005855560302734375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 6.0, 3.0, 7.0, 9.0, 11.0, 13.0, 17.0, 15.0, 25.0, 18.0, 29.0, 28.0, 44.0, 29.0, 40.0, 39.0, 38.0, 49.0, 48.0, 32.0, 52.0, 52.0, 50.0, 43.0, 39.0, 43.0, 30.0, 25.0, 21.0, 26.0, 14.0, 23.0, 19.0, 17.0, 15.0, 13.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0085296630859375, -0.008252501487731934, -0.007975339889526367, -0.007698178291320801, -0.007421016693115234, -0.007143855094909668, -0.0068666934967041016, -0.006589531898498535, -0.006312370300292969, -0.006035208702087402, -0.005758047103881836, -0.0054808855056762695, -0.005203723907470703, -0.004926562309265137, -0.00464940071105957, -0.004372239112854004, -0.0040950775146484375, -0.003817915916442871, -0.0035407543182373047, -0.0032635927200317383, -0.002986431121826172, -0.0027092695236206055, -0.002432107925415039, -0.0021549463272094727, -0.0018777847290039062, -0.0016006231307983398, -0.0013234615325927734, -0.001046299934387207, -0.0007691383361816406, -0.0004919767379760742, -0.0002148151397705078, 6.23464584350586e-05, 0.000339508056640625, 0.0006166696548461914, 0.0008938312530517578, 0.0011709928512573242, 0.0014481544494628906, 0.001725316047668457, 0.0020024776458740234, 0.00227963924407959, 0.0025568008422851562, 0.0028339624404907227, 0.003111124038696289, 0.0033882856369018555, 0.003665447235107422, 0.003942608833312988, 0.004219770431518555, 0.004496932029724121, 0.0047740936279296875, 0.005051255226135254, 0.00532841682434082, 0.005605578422546387, 0.005882740020751953, 0.0061599016189575195, 0.006437063217163086, 0.006714224815368652, 0.006991386413574219, 0.007268548011779785, 0.0075457096099853516, 0.007822871208190918, 0.008100032806396484, 0.00837719440460205, 0.008654356002807617, 0.008931517601013184, 0.00920867919921875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 5.0, 4.0, 23.0, 28.0, 24.0, 37.0, 59.0, 76.0, 105.0, 149.0, 197.0, 271.0, 386.0, 594.0, 829.0, 1192.0, 1900.0, 2764.0, 4473.0, 7305.0, 13544.0, 30037.0, 87617.0, 453499.0, 318253.0, 69315.0, 25142.0, 12026.0, 6581.0, 4062.0, 2501.0, 1702.0, 1208.0, 782.0, 571.0, 344.0, 282.0, 189.0, 120.0, 105.0, 71.0, 47.0, 43.0, 29.0, 14.0, 6.0, 6.0, 5.0, 7.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.008331298828125, -0.008052706718444824, -0.0077741146087646484, -0.007495522499084473, -0.007216930389404297, -0.006938338279724121, -0.006659746170043945, -0.0063811540603637695, -0.006102561950683594, -0.005823969841003418, -0.005545377731323242, -0.005266785621643066, -0.004988193511962891, -0.004709601402282715, -0.004431009292602539, -0.004152417182922363, -0.0038738250732421875, -0.0035952329635620117, -0.003316640853881836, -0.00303804874420166, -0.0027594566345214844, -0.0024808645248413086, -0.002202272415161133, -0.001923680305480957, -0.0016450881958007812, -0.0013664960861206055, -0.0010879039764404297, -0.0008093118667602539, -0.0005307197570800781, -0.00025212764739990234, 2.6464462280273438e-05, 0.0003050565719604492, 0.000583648681640625, 0.0008622407913208008, 0.0011408329010009766, 0.0014194250106811523, 0.0016980171203613281, 0.001976609230041504, 0.0022552013397216797, 0.0025337934494018555, 0.0028123855590820312, 0.003090977668762207, 0.003369569778442383, 0.0036481618881225586, 0.003926753997802734, 0.00420534610748291, 0.004483938217163086, 0.004762530326843262, 0.0050411224365234375, 0.005319714546203613, 0.005598306655883789, 0.005876898765563965, 0.006155490875244141, 0.006434082984924316, 0.006712675094604492, 0.006991267204284668, 0.007269859313964844, 0.0075484514236450195, 0.007827043533325195, 0.008105635643005371, 0.008384227752685547, 0.008662819862365723, 0.008941411972045898, 0.009220004081726074, 0.00949859619140625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 3.0, 5.0, 5.0, 3.0, 7.0, 4.0, 9.0, 21.0, 12.0, 13.0, 23.0, 20.0, 28.0, 33.0, 30.0, 34.0, 38.0, 49.0, 36.0, 41.0, 45.0, 54.0, 35.0, 37.0, 34.0, 38.0, 28.0, 38.0, 29.0, 33.0, 31.0, 23.0, 34.0, 21.0, 18.0, 17.0, 11.0, 10.0, 10.0, 4.0, 9.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00572967529296875, -0.005566835403442383, -0.005403995513916016, -0.0052411556243896484, -0.005078315734863281, -0.004915475845336914, -0.004752635955810547, -0.00458979606628418, -0.0044269561767578125, -0.004264116287231445, -0.004101276397705078, -0.003938436508178711, -0.0037755966186523438, -0.0036127567291259766, -0.0034499168395996094, -0.003287076950073242, -0.003124237060546875, -0.002961397171020508, -0.0027985572814941406, -0.0026357173919677734, -0.0024728775024414062, -0.002310037612915039, -0.002147197723388672, -0.0019843578338623047, -0.0018215179443359375, -0.0016586780548095703, -0.0014958381652832031, -0.001332998275756836, -0.0011701583862304688, -0.0010073184967041016, -0.0008444786071777344, -0.0006816387176513672, -0.000518798828125, -0.0003559589385986328, -0.00019311904907226562, -3.0279159545898438e-05, 0.00013256072998046875, 0.00029540061950683594, 0.0004582405090332031, 0.0006210803985595703, 0.0007839202880859375, 0.0009467601776123047, 0.0011096000671386719, 0.001272439956665039, 0.0014352798461914062, 0.0015981197357177734, 0.0017609596252441406, 0.0019237995147705078, 0.002086639404296875, 0.002249479293823242, 0.0024123191833496094, 0.0025751590728759766, 0.0027379989624023438, 0.002900838851928711, 0.003063678741455078, 0.0032265186309814453, 0.0033893585205078125, 0.0035521984100341797, 0.003715038299560547, 0.003877878189086914, 0.004040718078613281, 0.0042035579681396484, 0.004366397857666016, 0.004529237747192383, 0.00469207763671875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 8.0, 12.0, 18.0, 29.0, 28.0, 38.0, 60.0, 71.0, 100.0, 140.0, 183.0, 243.0, 384.0, 575.0, 830.0, 1323.0, 2052.0, 3206.0, 5717.0, 10481.0, 22319.0, 63304.0, 515852.0, 324691.0, 53418.0, 19911.0, 9707.0, 5056.0, 2962.0, 1873.0, 1199.0, 806.0, 555.0, 362.0, 312.0, 190.0, 143.0, 113.0, 65.0, 54.0, 50.0, 26.0, 26.0, 12.0, 11.0, 10.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0007338523864746094, -0.0007122233510017395, -0.0006905943155288696, -0.0006689652800559998, -0.0006473362445831299, -0.00062570720911026, -0.0006040781736373901, -0.0005824491381645203, -0.0005608201026916504, -0.0005391910672187805, -0.0005175620317459106, -0.0004959329962730408, -0.0004743039608001709, -0.000452674925327301, -0.00043104588985443115, -0.0004094168543815613, -0.0003877878189086914, -0.00036615878343582153, -0.00034452974796295166, -0.0003229007124900818, -0.0003012716770172119, -0.00027964264154434204, -0.00025801360607147217, -0.0002363845705986023, -0.00021475553512573242, -0.00019312649965286255, -0.00017149746417999268, -0.0001498684287071228, -0.00012823939323425293, -0.00010661035776138306, -8.498132228851318e-05, -6.335228681564331e-05, -4.172325134277344e-05, -2.0094215869903564e-05, 1.5348196029663086e-06, 2.316385507583618e-05, 4.4792890548706055e-05, 6.642192602157593e-05, 8.80509614944458e-05, 0.00010967999696731567, 0.00013130903244018555, 0.00015293806791305542, 0.0001745671033859253, 0.00019619613885879517, 0.00021782517433166504, 0.0002394542098045349, 0.0002610832452774048, 0.00028271228075027466, 0.00030434131622314453, 0.0003259703516960144, 0.0003475993871688843, 0.00036922842264175415, 0.000390857458114624, 0.0004124864935874939, 0.00043411552906036377, 0.00045574456453323364, 0.0004773736000061035, 0.0004990026354789734, 0.0005206316709518433, 0.0005422607064247131, 0.000563889741897583, 0.0005855187773704529, 0.0006071478128433228, 0.0006287768483161926, 0.0006504058837890625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 8.0, 12.0, 14.0, 11.0, 12.0, 30.0, 0.0, 37.0, 53.0, 83.0, 87.0, 92.0, 114.0, 93.0, 78.0, 77.0, 53.0, 42.0, 30.0, 21.0, 15.0, 7.0, 0.0, 5.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.086162567138672e-06, -2.030283212661743e-06, -1.9744038581848145e-06, -1.9185245037078857e-06, -1.862645149230957e-06, -1.8067657947540283e-06, -1.7508864402770996e-06, -1.695007085800171e-06, -1.6391277313232422e-06, -1.5832483768463135e-06, -1.5273690223693848e-06, -1.471489667892456e-06, -1.4156103134155273e-06, -1.3597309589385986e-06, -1.30385160446167e-06, -1.2479722499847412e-06, -1.1920928955078125e-06, -1.1362135410308838e-06, -1.080334186553955e-06, -1.0244548320770264e-06, -9.685754776000977e-07, -9.126961231231689e-07, -8.568167686462402e-07, -8.009374141693115e-07, -7.450580596923828e-07, -6.891787052154541e-07, -6.332993507385254e-07, -5.774199962615967e-07, -5.21540641784668e-07, -4.6566128730773926e-07, -4.0978193283081055e-07, -3.5390257835388184e-07, -2.980232238769531e-07, -2.421438694000244e-07, -1.862645149230957e-07, -1.30385160446167e-07, -7.450580596923828e-08, -1.862645149230957e-08, 3.725290298461914e-08, 9.313225746154785e-08, 1.4901161193847656e-07, 2.0489096641540527e-07, 2.60770320892334e-07, 3.166496753692627e-07, 3.725290298461914e-07, 4.284083843231201e-07, 4.842877388000488e-07, 5.401670932769775e-07, 5.960464477539062e-07, 6.51925802230835e-07, 7.078051567077637e-07, 7.636845111846924e-07, 8.195638656616211e-07, 8.754432201385498e-07, 9.313225746154785e-07, 9.872019290924072e-07, 1.043081283569336e-06, 1.0989606380462646e-06, 1.1548399925231934e-06, 1.210719347000122e-06, 1.2665987014770508e-06, 1.3224780559539795e-06, 1.3783574104309082e-06, 1.434236764907837e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 14.0, 11.0, 18.0, 16.0, 44.0, 51.0, 69.0, 116.0, 168.0, 216.0, 331.0, 565.0, 913.0, 1410.0, 2364.0, 3931.0, 7404.0, 13956.0, 30573.0, 84982.0, 462053.0, 315058.0, 69447.0, 26402.0, 12477.0, 6523.0, 3701.0, 2106.0, 1323.0, 801.0, 514.0, 344.0, 195.0, 131.0, 84.0, 75.0, 42.0, 30.0, 29.0, 19.0, 21.0, 15.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000881195068359375, -0.0008526891469955444, -0.0008241832256317139, -0.0007956773042678833, -0.0007671713829040527, -0.0007386654615402222, -0.0007101595401763916, -0.000681653618812561, -0.0006531476974487305, -0.0006246417760848999, -0.0005961358547210693, -0.0005676299333572388, -0.0005391240119934082, -0.0005106180906295776, -0.00048211216926574707, -0.0004536062479019165, -0.00042510032653808594, -0.00039659440517425537, -0.0003680884838104248, -0.00033958256244659424, -0.00031107664108276367, -0.0002825707197189331, -0.00025406479835510254, -0.00022555887699127197, -0.0001970529556274414, -0.00016854703426361084, -0.00014004111289978027, -0.00011153519153594971, -8.302927017211914e-05, -5.4523348808288574e-05, -2.6017427444458008e-05, 2.4884939193725586e-06, 3.0994415283203125e-05, 5.950033664703369e-05, 8.800625801086426e-05, 0.00011651217937469482, 0.0001450181007385254, 0.00017352402210235596, 0.00020202994346618652, 0.0002305358648300171, 0.00025904178619384766, 0.0002875477075576782, 0.0003160536289215088, 0.00034455955028533936, 0.0003730654716491699, 0.0004015713930130005, 0.00043007731437683105, 0.0004585832357406616, 0.0004870891571044922, 0.0005155950784683228, 0.0005441009998321533, 0.0005726069211959839, 0.0006011128425598145, 0.000629618763923645, 0.0006581246852874756, 0.0006866306066513062, 0.0007151365280151367, 0.0007436424493789673, 0.0007721483707427979, 0.0008006542921066284, 0.000829160213470459, 0.0008576661348342896, 0.0008861720561981201, 0.0009146779775619507, 0.0009431838989257812]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 8.0, 6.0, 12.0, 10.0, 16.0, 12.0, 29.0, 21.0, 41.0, 54.0, 67.0, 72.0, 125.0, 153.0, 85.0, 46.0, 54.0, 42.0, 33.0, 18.0, 17.0, 9.0, 15.0, 9.0, 7.0, 4.0, 6.0, 5.0, 2.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00026988983154296875, -0.0002629850059747696, -0.00025608018040657043, -0.0002491753548383713, -0.00024227052927017212, -0.00023536570370197296, -0.0002284608781337738, -0.00022155605256557465, -0.0002146512269973755, -0.00020774640142917633, -0.00020084157586097717, -0.00019393675029277802, -0.00018703192472457886, -0.0001801270991563797, -0.00017322227358818054, -0.00016631744801998138, -0.00015941262245178223, -0.00015250779688358307, -0.0001456029713153839, -0.00013869814574718475, -0.0001317933201789856, -0.00012488849461078644, -0.00011798366904258728, -0.00011107884347438812, -0.00010417401790618896, -9.726919233798981e-05, -9.036436676979065e-05, -8.345954120159149e-05, -7.655471563339233e-05, -6.964989006519318e-05, -6.274506449699402e-05, -5.584023892879486e-05, -4.89354133605957e-05, -4.2030587792396545e-05, -3.512576222419739e-05, -2.822093665599823e-05, -2.1316111087799072e-05, -1.4411285519599915e-05, -7.506459951400757e-06, -6.016343832015991e-07, 6.303191184997559e-06, 1.3208016753196716e-05, 2.0112842321395874e-05, 2.7017667889595032e-05, 3.392249345779419e-05, 4.082731902599335e-05, 4.7732144594192505e-05, 5.463697016239166e-05, 6.154179573059082e-05, 6.844662129878998e-05, 7.535144686698914e-05, 8.22562724351883e-05, 8.916109800338745e-05, 9.606592357158661e-05, 0.00010297074913978577, 0.00010987557470798492, 0.00011678040027618408, 0.00012368522584438324, 0.0001305900514125824, 0.00013749487698078156, 0.0001443997025489807, 0.00015130452811717987, 0.00015820935368537903, 0.00016511417925357819, 0.00017201900482177734]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 6.0, 3.0, 4.0, 3.0, 9.0, 7.0, 8.0, 10.0, 9.0, 10.0, 25.0, 20.0, 37.0, 24.0, 33.0, 45.0, 58.0, 79.0, 89.0, 105.0, 75.0, 74.0, 48.0, 47.0, 40.0, 24.0, 16.0, 18.0, 14.0, 14.0, 12.0, 4.0, 6.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010334598831832409, -0.010013062506914139, -0.009691527113318443, -0.009369990788400173, -0.009048455394804478, -0.008726919069886208, -0.008405383676290512, -0.008083847351372242, -0.007762311492115259, -0.007440775632858276, -0.0071192397736012936, -0.006797703914344311, -0.006476167589426041, -0.006154632195830345, -0.005833095870912075, -0.005511560011655092, -0.0051900241523981094, -0.004868488293141127, -0.004546952433884144, -0.004225416574627161, -0.0039038804825395346, -0.0035823446232825518, -0.0032608085311949253, -0.0029392726719379425, -0.0026177368126809597, -0.002296200953423977, -0.001974665094166994, -0.0016531290020793676, -0.0013315931428223848, -0.001010057283565402, -0.0006885213078930974, -0.00036698533222079277, -4.544854164123535e-05, 0.00027608737582340837, 0.0005976232932880521, 0.0009191592107526958, 0.0012406951282173395, 0.0015622309874743223, 0.001883766963146627, 0.0022053029388189316, 0.0025268387980759144, 0.002848374657332897, 0.00316991051658988, 0.0034914466086775064, 0.0038129824679344893, 0.004134518094360828, 0.0044560544192790985, 0.004777590278536081, 0.005099126137793064, 0.005420661997050047, 0.00574219785630703, 0.0060637337155640125, 0.006385269574820995, 0.0067068058997392654, 0.007028341758996248, 0.007349877618253231, 0.007671413477510214, 0.007992949336767197, 0.008314485661685467, 0.008636021055281162, 0.008957557380199432, 0.009279092773795128, 0.009600629098713398, 0.009922165423631668, 0.010243700817227364]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 9.0, 7.0, 8.0, 16.0, 10.0, 8.0, 26.0, 23.0, 18.0, 28.0, 28.0, 30.0, 39.0, 37.0, 38.0, 44.0, 47.0, 43.0, 41.0, 38.0, 44.0, 48.0, 41.0, 42.0, 41.0, 26.0, 23.0, 24.0, 22.0, 20.0, 18.0, 21.0, 21.0, 16.0, 11.0, 10.0, 10.0, 4.0, 3.0, 3.0, 1.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.007877729833126068, -0.007622381206601858, -0.007367032114416361, -0.007111683487892151, -0.006856334861367941, -0.006600986234843731, -0.006345637142658234, -0.006090288516134024, -0.005834939889609814, -0.005579591263085604, -0.005324242170900106, -0.0050688935443758965, -0.0048135449178516865, -0.0045581962913274765, -0.004302847199141979, -0.004047498572617769, -0.003792149480432272, -0.0035368006210774183, -0.0032814519945532084, -0.0030261031351983547, -0.0027707545086741447, -0.002515405649319291, -0.0022600567899644375, -0.0020047081634402275, -0.0017493593040853739, -0.001494010561145842, -0.0012386618182063103, -0.0009833129588514566, -0.0007279642159119248, -0.00047261547297239304, -0.0002172666136175394, 3.80821293219924e-05, 0.0002934308722615242, 0.000548779615201056, 0.0008041284163482487, 0.0010594772174954414, 0.0013148259604349732, 0.001570174703374505, 0.0018255235627293587, 0.0020808721892535686, 0.0023362210486084223, 0.002591569907963276, 0.002846918534487486, 0.0031022673938423395, 0.003357616253197193, 0.003612964879721403, 0.0038683137390762568, 0.00412366259843111, 0.00437901122495532, 0.00463435985147953, 0.004889708943665028, 0.005145057570189238, 0.005400406196713448, 0.005655755288898945, 0.005911103915423155, 0.006166452541947365, 0.006421801634132862, 0.006677150260657072, 0.006932499352842569, 0.007187847979366779, 0.007443196605890989, 0.007698545232415199, 0.007953894324600697, 0.008209243416786194, 0.008464591577649117]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 12.0, 12.0, 26.0, 32.0, 44.0, 58.0, 89.0, 137.0, 185.0, 291.0, 403.0, 614.0, 978.0, 1524.0, 2314.0, 3593.0, 5641.0, 8638.0, 13768.0, 21813.0, 35690.0, 61819.0, 117708.0, 248873.0, 248533.0, 117402.0, 61999.0, 36089.0, 22112.0, 13579.0, 8629.0, 5616.0, 3546.0, 2336.0, 1525.0, 1022.0, 665.0, 390.0, 279.0, 160.0, 126.0, 89.0, 64.0, 37.0, 31.0, 17.0, 17.0, 11.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0160675048828125, -0.01556539535522461, -0.015063285827636719, -0.014561176300048828, -0.014059066772460938, -0.013556957244873047, -0.013054847717285156, -0.012552738189697266, -0.012050628662109375, -0.011548519134521484, -0.011046409606933594, -0.010544300079345703, -0.010042190551757812, -0.009540081024169922, -0.009037971496582031, -0.00853586196899414, -0.00803375244140625, -0.007531642913818359, -0.007029533386230469, -0.006527423858642578, -0.0060253143310546875, -0.005523204803466797, -0.005021095275878906, -0.004518985748291016, -0.004016876220703125, -0.0035147666931152344, -0.0030126571655273438, -0.002510547637939453, -0.0020084381103515625, -0.0015063285827636719, -0.0010042190551757812, -0.0005021095275878906, 0.0, 0.0005021095275878906, 0.0010042190551757812, 0.0015063285827636719, 0.0020084381103515625, 0.002510547637939453, 0.0030126571655273438, 0.0035147666931152344, 0.004016876220703125, 0.004518985748291016, 0.005021095275878906, 0.005523204803466797, 0.0060253143310546875, 0.006527423858642578, 0.007029533386230469, 0.007531642913818359, 0.00803375244140625, 0.00853586196899414, 0.009037971496582031, 0.009540081024169922, 0.010042190551757812, 0.010544300079345703, 0.011046409606933594, 0.011548519134521484, 0.012050628662109375, 0.012552738189697266, 0.013054847717285156, 0.013556957244873047, 0.014059066772460938, 0.014561176300048828, 0.015063285827636719, 0.01556539535522461, 0.0160675048828125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 11.0, 7.0, 12.0, 10.0, 12.0, 18.0, 27.0, 23.0, 21.0, 28.0, 42.0, 47.0, 27.0, 35.0, 40.0, 50.0, 45.0, 44.0, 53.0, 53.0, 55.0, 38.0, 34.0, 38.0, 27.0, 26.0, 28.0, 19.0, 15.0, 19.0, 22.0, 20.0, 17.0, 10.0, 7.0, 9.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007099151611328125, -0.006860554218292236, -0.006621956825256348, -0.006383359432220459, -0.00614476203918457, -0.005906164646148682, -0.005667567253112793, -0.005428969860076904, -0.005190372467041016, -0.004951775074005127, -0.004713177680969238, -0.00447458028793335, -0.004235982894897461, -0.003997385501861572, -0.0037587881088256836, -0.003520190715789795, -0.0032815933227539062, -0.0030429959297180176, -0.002804398536682129, -0.0025658011436462402, -0.0023272037506103516, -0.002088606357574463, -0.0018500089645385742, -0.0016114115715026855, -0.0013728141784667969, -0.0011342167854309082, -0.0008956193923950195, -0.0006570219993591309, -0.0004184246063232422, -0.00017982721328735352, 5.8770179748535156e-05, 0.00029736757278442383, 0.0005359649658203125, 0.0007745623588562012, 0.0010131597518920898, 0.0012517571449279785, 0.0014903545379638672, 0.0017289519309997559, 0.0019675493240356445, 0.002206146717071533, 0.002444744110107422, 0.0026833415031433105, 0.0029219388961791992, 0.003160536289215088, 0.0033991336822509766, 0.0036377310752868652, 0.003876328468322754, 0.004114925861358643, 0.004353523254394531, 0.00459212064743042, 0.004830718040466309, 0.005069315433502197, 0.005307912826538086, 0.005546510219573975, 0.005785107612609863, 0.006023705005645752, 0.006262302398681641, 0.006500899791717529, 0.006739497184753418, 0.006978094577789307, 0.007216691970825195, 0.007455289363861084, 0.007693886756896973, 0.007932484149932861, 0.00817108154296875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 8.0, 19.0, 23.0, 26.0, 63.0, 80.0, 120.0, 167.0, 253.0, 378.0, 551.0, 858.0, 1280.0, 1964.0, 2961.0, 4474.0, 7125.0, 11271.0, 18234.0, 29622.0, 50643.0, 89317.0, 176132.0, 289223.0, 159768.0, 82692.0, 46905.0, 27647.0, 17020.0, 10529.0, 6779.0, 4219.0, 2810.0, 1804.0, 1193.0, 789.0, 494.0, 380.0, 238.0, 151.0, 120.0, 70.0, 65.0, 30.0, 19.0, 16.0, 8.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0139923095703125, -0.013532519340515137, -0.013072729110717773, -0.01261293888092041, -0.012153148651123047, -0.011693358421325684, -0.01123356819152832, -0.010773777961730957, -0.010313987731933594, -0.00985419750213623, -0.009394407272338867, -0.008934617042541504, -0.00847482681274414, -0.008015036582946777, -0.007555246353149414, -0.007095456123352051, -0.0066356658935546875, -0.006175875663757324, -0.005716085433959961, -0.005256295204162598, -0.004796504974365234, -0.004336714744567871, -0.003876924514770508, -0.0034171342849731445, -0.0029573440551757812, -0.002497553825378418, -0.0020377635955810547, -0.0015779733657836914, -0.0011181831359863281, -0.0006583929061889648, -0.00019860267639160156, 0.0002611875534057617, 0.000720977783203125, 0.0011807680130004883, 0.0016405582427978516, 0.002100348472595215, 0.002560138702392578, 0.0030199289321899414, 0.0034797191619873047, 0.003939509391784668, 0.004399299621582031, 0.0048590898513793945, 0.005318880081176758, 0.005778670310974121, 0.006238460540771484, 0.006698250770568848, 0.007158041000366211, 0.007617831230163574, 0.008077621459960938, 0.0085374116897583, 0.008997201919555664, 0.009456992149353027, 0.00991678237915039, 0.010376572608947754, 0.010836362838745117, 0.01129615306854248, 0.011755943298339844, 0.012215733528137207, 0.01267552375793457, 0.013135313987731934, 0.013595104217529297, 0.01405489444732666, 0.014514684677124023, 0.014974474906921387, 0.01543426513671875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 4.0, 10.0, 15.0, 11.0, 12.0, 19.0, 34.0, 21.0, 23.0, 32.0, 31.0, 28.0, 41.0, 39.0, 35.0, 52.0, 41.0, 54.0, 42.0, 38.0, 33.0, 36.0, 47.0, 31.0, 31.0, 30.0, 33.0, 19.0, 22.0, 19.0, 21.0, 12.0, 17.0, 12.0, 6.0, 5.0, 8.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.004779815673828125, -0.004640460014343262, -0.0045011043548583984, -0.004361748695373535, -0.004222393035888672, -0.004083037376403809, -0.003943681716918945, -0.003804326057434082, -0.0036649703979492188, -0.0035256147384643555, -0.003386259078979492, -0.003246903419494629, -0.0031075477600097656, -0.0029681921005249023, -0.002828836441040039, -0.0026894807815551758, -0.0025501251220703125, -0.0024107694625854492, -0.002271413803100586, -0.0021320581436157227, -0.0019927024841308594, -0.001853346824645996, -0.0017139911651611328, -0.0015746355056762695, -0.0014352798461914062, -0.001295924186706543, -0.0011565685272216797, -0.0010172128677368164, -0.0008778572082519531, -0.0007385015487670898, -0.0005991458892822266, -0.0004597902297973633, -0.0003204345703125, -0.00018107891082763672, -4.172325134277344e-05, 9.763240814208984e-05, 0.00023698806762695312, 0.0003763437271118164, 0.0005156993865966797, 0.000655055046081543, 0.0007944107055664062, 0.0009337663650512695, 0.0010731220245361328, 0.001212477684020996, 0.0013518333435058594, 0.0014911890029907227, 0.001630544662475586, 0.0017699003219604492, 0.0019092559814453125, 0.0020486116409301758, 0.002187967300415039, 0.0023273229598999023, 0.0024666786193847656, 0.002606034278869629, 0.002745389938354492, 0.0028847455978393555, 0.0030241012573242188, 0.003163456916809082, 0.0033028125762939453, 0.0034421682357788086, 0.003581523895263672, 0.003720879554748535, 0.0038602352142333984, 0.003999590873718262, 0.004138946533203125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 9.0, 6.0, 15.0, 20.0, 24.0, 42.0, 39.0, 45.0, 49.0, 84.0, 75.0, 110.0, 141.0, 148.0, 213.0, 268.0, 351.0, 463.0, 695.0, 1012.0, 1673.0, 2646.0, 4615.0, 9325.0, 23644.0, 134281.0, 807013.0, 34527.0, 11953.0, 5817.0, 3113.0, 1871.0, 1181.0, 755.0, 573.0, 381.0, 295.0, 244.0, 170.0, 138.0, 99.0, 116.0, 63.0, 50.0, 45.0, 40.0, 29.0, 26.0, 13.0, 9.0, 16.0, 8.0, 5.0, 3.0, 4.0, 1.0, 8.0], "bins": [-0.0013828277587890625, -0.001341119408607483, -0.0012994110584259033, -0.0012577027082443237, -0.0012159943580627441, -0.0011742860078811646, -0.001132577657699585, -0.0010908693075180054, -0.0010491609573364258, -0.0010074526071548462, -0.0009657442569732666, -0.000924035906791687, -0.0008823275566101074, -0.0008406192064285278, -0.0007989108562469482, -0.0007572025060653687, -0.0007154941558837891, -0.0006737858057022095, -0.0006320774555206299, -0.0005903691053390503, -0.0005486607551574707, -0.0005069524049758911, -0.0004652440547943115, -0.00042353570461273193, -0.00038182735443115234, -0.00034011900424957275, -0.00029841065406799316, -0.0002567023038864136, -0.00021499395370483398, -0.0001732856035232544, -0.0001315772533416748, -8.986890316009521e-05, -4.8160552978515625e-05, -6.452202796936035e-06, 3.5256147384643555e-05, 7.696449756622314e-05, 0.00011867284774780273, 0.00016038119792938232, 0.00020208954811096191, 0.0002437978982925415, 0.0002855062484741211, 0.0003272145986557007, 0.0003689229488372803, 0.00041063129901885986, 0.00045233964920043945, 0.000494047999382019, 0.0005357563495635986, 0.0005774646997451782, 0.0006191730499267578, 0.0006608814001083374, 0.000702589750289917, 0.0007442981004714966, 0.0007860064506530762, 0.0008277148008346558, 0.0008694231510162354, 0.0009111315011978149, 0.0009528398513793945, 0.0009945482015609741, 0.0010362565517425537, 0.0010779649019241333, 0.0011196732521057129, 0.0011613816022872925, 0.001203089952468872, 0.0012447983026504517, 0.0012865066528320312]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 14.0, 0.0, 34.0, 0.0, 0.0, 54.0, 0.0, 81.0, 0.0, 137.0, 0.0, 0.0, 384.0, 0.0, 130.0, 0.0, 86.0, 0.0, 0.0, 33.0, 0.0, 24.0, 0.0, 0.0, 19.0, 0.0, 7.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 10.0, 7.0, 14.0, 10.0, 21.0, 44.0, 41.0, 65.0, 80.0, 111.0, 135.0, 219.0, 272.0, 367.0, 550.0, 717.0, 1078.0, 1582.0, 2415.0, 3891.0, 7146.0, 16900.0, 84064.0, 869313.0, 33627.0, 10922.0, 5297.0, 3129.0, 1991.0, 1313.0, 912.0, 647.0, 436.0, 342.0, 242.0, 167.0, 131.0, 99.0, 65.0, 44.0, 31.0, 25.0, 26.0, 14.0, 13.0, 7.0, 5.0, 11.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0020351409912109375, -0.0019757598638534546, -0.0019163787364959717, -0.0018569976091384888, -0.0017976164817810059, -0.001738235354423523, -0.00167885422706604, -0.0016194730997085571, -0.0015600919723510742, -0.0015007108449935913, -0.0014413297176361084, -0.0013819485902786255, -0.0013225674629211426, -0.0012631863355636597, -0.0012038052082061768, -0.0011444240808486938, -0.001085042953491211, -0.001025661826133728, -0.0009662806987762451, -0.0009068995714187622, -0.0008475184440612793, -0.0007881373167037964, -0.0007287561893463135, -0.0006693750619888306, -0.0006099939346313477, -0.0005506128072738647, -0.0004912316799163818, -0.0004318505525588989, -0.000372469425201416, -0.0003130882978439331, -0.0002537071704864502, -0.00019432604312896729, -0.00013494491577148438, -7.556378841400146e-05, -1.6182661056518555e-05, 4.3198466300964355e-05, 0.00010257959365844727, 0.00016196072101593018, 0.00022134184837341309, 0.000280722975730896, 0.0003401041030883789, 0.0003994852304458618, 0.0004588663578033447, 0.0005182474851608276, 0.0005776286125183105, 0.0006370097398757935, 0.0006963908672332764, 0.0007557719945907593, 0.0008151531219482422, 0.0008745342493057251, 0.000933915376663208, 0.000993296504020691, 0.0010526776313781738, 0.0011120587587356567, 0.0011714398860931396, 0.0012308210134506226, 0.0012902021408081055, 0.0013495832681655884, 0.0014089643955230713, 0.0014683455228805542, 0.0015277266502380371, 0.00158710777759552, 0.001646488904953003, 0.0017058700323104858, 0.0017652511596679688]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 6.0, 14.0, 17.0, 26.0, 62.0, 512.0, 228.0, 37.0, 27.0, 12.0, 13.0, 5.0, 4.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005049705505371094, -0.00048692524433135986, -0.00046887993812561035, -0.00045083463191986084, -0.00043278932571411133, -0.0004147440195083618, -0.0003966987133026123, -0.0003786534070968628, -0.0003606081008911133, -0.00034256279468536377, -0.00032451748847961426, -0.00030647218227386475, -0.00028842687606811523, -0.0002703815698623657, -0.0002523362636566162, -0.0002342909574508667, -0.0002162456512451172, -0.00019820034503936768, -0.00018015503883361816, -0.00016210973262786865, -0.00014406442642211914, -0.00012601912021636963, -0.00010797381401062012, -8.99285078048706e-05, -7.18832015991211e-05, -5.383789539337158e-05, -3.579258918762207e-05, -1.774728298187256e-05, 2.980232238769531e-07, 1.8343329429626465e-05, 3.6388635635375977e-05, 5.443394184112549e-05, 7.2479248046875e-05, 9.052455425262451e-05, 0.00010856986045837402, 0.00012661516666412354, 0.00014466047286987305, 0.00016270577907562256, 0.00018075108528137207, 0.00019879639148712158, 0.0002168416976928711, 0.0002348870038986206, 0.0002529323101043701, 0.00027097761631011963, 0.00028902292251586914, 0.00030706822872161865, 0.00032511353492736816, 0.0003431588411331177, 0.0003612041473388672, 0.0003792494535446167, 0.0003972947597503662, 0.0004153400659561157, 0.00043338537216186523, 0.00045143067836761475, 0.00046947598457336426, 0.00048752129077911377, 0.0005055665969848633, 0.0005236119031906128, 0.0005416572093963623, 0.0005597025156021118, 0.0005777478218078613, 0.0005957931280136108, 0.0006138384342193604, 0.0006318837404251099, 0.0006499290466308594]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 3.0, 11.0, 10.0, 8.0, 14.0, 17.0, 23.0, 29.0, 33.0, 45.0, 68.0, 63.0, 93.0, 118.0, 101.0, 68.0, 61.0, 54.0, 48.0, 20.0, 31.0, 11.0, 15.0, 14.0, 7.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008932476863265038, -0.008596029132604599, -0.008259580470621586, -0.007923132739961147, -0.007586684077978134, -0.007250236347317696, -0.00691378815099597, -0.006577339954674244, -0.006240891758352518, -0.005904443562030792, -0.005567995365709066, -0.0052315471693873405, -0.004895099438726902, -0.004558650776743889, -0.00422220304608345, -0.0038857548497617245, -0.0035493066534399986, -0.0032128584571182728, -0.002876410260796547, -0.0025399622973054647, -0.002203514100983739, -0.001867065904662013, -0.0015306179411709309, -0.001194169744849205, -0.0008577215485274792, -0.0005212734104134142, -0.0001848252722993493, 0.0001516228076070547, 0.00048807100392878056, 0.0008245192002505064, 0.0011609671637415886, 0.0014974153600633144, 0.001833864487707615, 0.0021703126840293407, 0.0025067608803510666, 0.0028432088438421488, 0.0031796570401638746, 0.0035161052364856005, 0.0038525531999766827, 0.0041890013962984085, 0.004525449592620134, 0.00486189778894186, 0.005198345985263586, 0.005534794181585312, 0.00587124191224575, 0.006207690574228764, 0.006544138304889202, 0.006880586501210928, 0.007217034697532654, 0.00755348289385438, 0.007889931090176105, 0.008226378820836544, 0.008562827482819557, 0.008899275213479996, 0.009235722944140434, 0.009572171606123447, 0.00990862026810646, 0.010245067998766899, 0.010581516660749912, 0.01091796439141035, 0.011254413053393364, 0.011590860784053802, 0.011927308514714241, 0.012263757176697254, 0.012600204907357693]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 8.0, 14.0, 12.0, 11.0, 22.0, 23.0, 23.0, 28.0, 34.0, 30.0, 41.0, 37.0, 46.0, 39.0, 50.0, 38.0, 48.0, 53.0, 36.0, 52.0, 39.0, 40.0, 39.0, 27.0, 30.0, 30.0, 21.0, 21.0, 25.0, 11.0, 12.0, 15.0, 5.0, 8.0, 5.0, 5.0, 4.0, 8.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.008423611521720886, -0.00816772598773241, -0.007911840453743935, -0.007655955385416746, -0.007400070317089558, -0.007144184783101082, -0.006888299249112606, -0.00663241371512413, -0.006376528646796942, -0.006120643112808466, -0.0058647580444812775, -0.005608872510492802, -0.005352986976504326, -0.005097101908177137, -0.004841216374188662, -0.004585331305861473, -0.004329445771872997, -0.0040735602378845215, -0.003817675169557333, -0.003561789635568857, -0.003305904334411025, -0.003050019033253193, -0.002794133499264717, -0.002538248198106885, -0.002282362896949053, -0.0020264775957912207, -0.0017705921782180667, -0.0015147067606449127, -0.0012588214594870806, -0.0010029361583292484, -0.0007470507407560945, -0.0004911653231829405, -0.00023527909070253372, 2.0606268662959337e-05, 0.0002764916280284524, 0.0005323769873939455, 0.0007882623467594385, 0.0010441476479172707, 0.0013000330654904246, 0.0015559184830635786, 0.0018118037842214108, 0.002067689085379243, 0.002323574386537075, 0.002579459920525551, 0.002835345221683383, 0.003091230522841215, 0.003347116056829691, 0.003603001357987523, 0.0038588866591453552, 0.004114772193133831, 0.0043706572614610195, 0.004626542795449495, 0.004882427863776684, 0.00513831339776516, 0.005394198931753635, 0.005650084465742111, 0.0059059695340693, 0.0061618550680577755, 0.006417740136384964, 0.00667362567037344, 0.006929511204361916, 0.007185396272689104, 0.00744128180667758, 0.007697166875004768, 0.007953052408993244]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 14.0, 31.0, 50.0, 77.0, 117.0, 209.0, 292.0, 474.0, 659.0, 972.0, 1478.0, 2286.0, 3445.0, 5249.0, 8190.0, 13116.0, 21050.0, 34501.0, 60365.0, 110891.0, 230115.0, 665798.0, 1746725.0, 755284.0, 242303.0, 118353.0, 66897.0, 39127.0, 23729.0, 14682.0, 9570.0, 6123.0, 4010.0, 2609.0, 1717.0, 1175.0, 800.0, 534.0, 384.0, 259.0, 195.0, 119.0, 93.0, 61.0, 33.0, 40.0, 21.0, 14.0, 7.0, 10.0, 11.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.00836944580078125, -0.00807642936706543, -0.007783412933349609, -0.007490396499633789, -0.007197380065917969, -0.0069043636322021484, -0.006611347198486328, -0.006318330764770508, -0.0060253143310546875, -0.005732297897338867, -0.005439281463623047, -0.0051462650299072266, -0.004853248596191406, -0.004560232162475586, -0.004267215728759766, -0.003974199295043945, -0.003681182861328125, -0.0033881664276123047, -0.0030951499938964844, -0.002802133560180664, -0.0025091171264648438, -0.0022161006927490234, -0.0019230842590332031, -0.0016300678253173828, -0.0013370513916015625, -0.0010440349578857422, -0.0007510185241699219, -0.00045800209045410156, -0.00016498565673828125, 0.00012803077697753906, 0.0004210472106933594, 0.0007140636444091797, 0.001007080078125, 0.0013000965118408203, 0.0015931129455566406, 0.001886129379272461, 0.0021791458129882812, 0.0024721622467041016, 0.002765178680419922, 0.003058195114135742, 0.0033512115478515625, 0.003644227981567383, 0.003937244415283203, 0.0042302608489990234, 0.004523277282714844, 0.004816293716430664, 0.005109310150146484, 0.005402326583862305, 0.005695343017578125, 0.005988359451293945, 0.006281375885009766, 0.006574392318725586, 0.006867408752441406, 0.0071604251861572266, 0.007453441619873047, 0.007746458053588867, 0.008039474487304688, 0.008332490921020508, 0.008625507354736328, 0.008918523788452148, 0.009211540222167969, 0.009504556655883789, 0.00979757308959961, 0.01009058952331543, 0.01038360595703125]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 9.0, 9.0, 11.0, 19.0, 20.0, 19.0, 24.0, 32.0, 29.0, 30.0, 33.0, 39.0, 43.0, 43.0, 41.0, 47.0, 52.0, 38.0, 34.0, 39.0, 47.0, 26.0, 36.0, 33.0, 32.0, 36.0, 19.0, 17.0, 16.0, 21.0, 13.0, 12.0, 10.0, 12.0, 9.0, 1.0, 3.0, 5.0, 5.0, 5.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0039520263671875, -0.0038234591484069824, -0.003694891929626465, -0.0035663247108459473, -0.0034377574920654297, -0.003309190273284912, -0.0031806230545043945, -0.003052055835723877, -0.0029234886169433594, -0.002794921398162842, -0.0026663541793823242, -0.0025377869606018066, -0.002409219741821289, -0.0022806525230407715, -0.002152085304260254, -0.0020235180854797363, -0.0018949508666992188, -0.0017663836479187012, -0.0016378164291381836, -0.001509249210357666, -0.0013806819915771484, -0.0012521147727966309, -0.0011235475540161133, -0.0009949803352355957, -0.0008664131164550781, -0.0007378458976745605, -0.000609278678894043, -0.0004807114601135254, -0.0003521442413330078, -0.00022357702255249023, -9.500980377197266e-05, 3.355741500854492e-05, 0.0001621246337890625, 0.0002906918525695801, 0.00041925907135009766, 0.0005478262901306152, 0.0006763935089111328, 0.0008049607276916504, 0.000933527946472168, 0.0010620951652526855, 0.0011906623840332031, 0.0013192296028137207, 0.0014477968215942383, 0.0015763640403747559, 0.0017049312591552734, 0.001833498477935791, 0.0019620656967163086, 0.002090632915496826, 0.0022192001342773438, 0.0023477673530578613, 0.002476334571838379, 0.0026049017906188965, 0.002733469009399414, 0.0028620362281799316, 0.0029906034469604492, 0.003119170665740967, 0.0032477378845214844, 0.003376305103302002, 0.0035048723220825195, 0.003633439540863037, 0.0037620067596435547, 0.0038905739784240723, 0.00401914119720459, 0.004147708415985107, 0.004276275634765625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 8.0, 5.0, 12.0, 15.0, 25.0, 35.0, 70.0, 83.0, 140.0, 185.0, 290.0, 397.0, 631.0, 1006.0, 1527.0, 2255.0, 3525.0, 5459.0, 8955.0, 14131.0, 24284.0, 41897.0, 77004.0, 146928.0, 312754.0, 789304.0, 1550510.0, 650815.0, 269245.0, 129645.0, 68199.0, 37759.0, 21739.0, 13105.0, 8131.0, 5172.0, 3065.0, 2059.0, 1369.0, 881.0, 516.0, 374.0, 245.0, 171.0, 119.0, 85.0, 57.0, 37.0, 22.0, 17.0, 11.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.00762176513671875, -0.007386565208435059, -0.007151365280151367, -0.006916165351867676, -0.006680965423583984, -0.006445765495300293, -0.0062105655670166016, -0.00597536563873291, -0.005740165710449219, -0.005504965782165527, -0.005269765853881836, -0.0050345659255981445, -0.004799365997314453, -0.004564166069030762, -0.00432896614074707, -0.004093766212463379, -0.0038585662841796875, -0.003623366355895996, -0.0033881664276123047, -0.0031529664993286133, -0.002917766571044922, -0.0026825666427612305, -0.002447366714477539, -0.0022121667861938477, -0.0019769668579101562, -0.0017417669296264648, -0.0015065670013427734, -0.001271367073059082, -0.0010361671447753906, -0.0008009672164916992, -0.0005657672882080078, -0.0003305673599243164, -9.5367431640625e-05, 0.0001398324966430664, 0.0003750324249267578, 0.0006102323532104492, 0.0008454322814941406, 0.001080632209777832, 0.0013158321380615234, 0.0015510320663452148, 0.0017862319946289062, 0.0020214319229125977, 0.002256631851196289, 0.0024918317794799805, 0.002727031707763672, 0.0029622316360473633, 0.0031974315643310547, 0.003432631492614746, 0.0036678314208984375, 0.003903031349182129, 0.00413823127746582, 0.004373431205749512, 0.004608631134033203, 0.0048438310623168945, 0.005079030990600586, 0.005314230918884277, 0.005549430847167969, 0.00578463077545166, 0.0060198307037353516, 0.006255030632019043, 0.006490230560302734, 0.006725430488586426, 0.006960630416870117, 0.007195830345153809, 0.0074310302734375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 5.0, 7.0, 5.0, 13.0, 16.0, 21.0, 24.0, 29.0, 44.0, 38.0, 51.0, 61.0, 79.0, 100.0, 139.0, 148.0, 174.0, 230.0, 279.0, 296.0, 332.0, 349.0, 277.0, 221.0, 218.0, 160.0, 141.0, 129.0, 109.0, 82.0, 64.0, 61.0, 40.0, 30.0, 23.0, 21.0, 13.0, 15.0, 4.0, 8.0, 10.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0024127960205078125, -0.002336651086807251, -0.0022605061531066895, -0.002184361219406128, -0.0021082162857055664, -0.002032071352005005, -0.0019559264183044434, -0.0018797814846038818, -0.0018036365509033203, -0.0017274916172027588, -0.0016513466835021973, -0.0015752017498016357, -0.0014990568161010742, -0.0014229118824005127, -0.0013467669486999512, -0.0012706220149993896, -0.0011944770812988281, -0.0011183321475982666, -0.001042187213897705, -0.0009660422801971436, -0.000889897346496582, -0.0008137524127960205, -0.000737607479095459, -0.0006614625453948975, -0.0005853176116943359, -0.0005091726779937744, -0.0004330277442932129, -0.00035688281059265137, -0.00028073787689208984, -0.00020459294319152832, -0.0001284480094909668, -5.2303075790405273e-05, 2.384185791015625e-05, 9.998679161071777e-05, 0.0001761317253112793, 0.0002522766590118408, 0.00032842159271240234, 0.00040456652641296387, 0.0004807114601135254, 0.0005568563938140869, 0.0006330013275146484, 0.00070914626121521, 0.0007852911949157715, 0.000861436128616333, 0.0009375810623168945, 0.001013725996017456, 0.0010898709297180176, 0.001166015863418579, 0.0012421607971191406, 0.0013183057308197021, 0.0013944506645202637, 0.0014705955982208252, 0.0015467405319213867, 0.0016228854656219482, 0.0016990303993225098, 0.0017751753330230713, 0.0018513202667236328, 0.0019274652004241943, 0.002003610134124756, 0.0020797550678253174, 0.002155900001525879, 0.0022320449352264404, 0.002308189868927002, 0.0023843348026275635, 0.002460479736328125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 6.0, 7.0, 12.0, 17.0, 16.0, 17.0, 18.0, 25.0, 34.0, 49.0, 51.0, 63.0, 76.0, 89.0, 96.0, 77.0, 68.0, 56.0, 33.0, 35.0, 27.0, 25.0, 22.0, 16.0, 16.0, 10.0, 6.0, 4.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005857475101947784, -0.005668958183377981, -0.005480441264808178, -0.005291924811899662, -0.005103407893329859, -0.0049148909747600555, -0.004726374056190252, -0.004537857137620449, -0.004349340684711933, -0.00416082376614213, -0.003972306847572327, -0.003783790161833167, -0.0035952734760940075, -0.0034067565575242043, -0.003218239638954401, -0.0030297227203845978, -0.0028412058018147945, -0.0026526888832449913, -0.0024641721975058317, -0.0022756552789360285, -0.002087138593196869, -0.0018986216746270657, -0.0017101047560572624, -0.001521587953902781, -0.0013330711517482996, -0.0011445543495938182, -0.0009560374892316759, -0.0007675206288695335, -0.0005790038267150521, -0.0003904870245605707, -0.00020197010599076748, -1.3453303836286068e-05, 0.00017506396397948265, 0.0003635807952377945, 0.0005520976264961064, 0.0007406144868582487, 0.0009291312890127301, 0.0011176480911672115, 0.0013061650097370148, 0.0014946818118914962, 0.0016831986140459776, 0.001871715416200459, 0.0020602322183549404, 0.0022487491369247437, 0.002437266055494547, 0.0026257827412337065, 0.0028142996598035097, 0.0030028163455426693, 0.0031913332641124725, 0.0033798501826822758, 0.0035683668684214354, 0.0037568837869912386, 0.003945400472730398, 0.004133917391300201, 0.004322434309870005, 0.004510951228439808, 0.004699467681348324, 0.004887984599918127, 0.00507650151848793, 0.005265017971396446, 0.0054535348899662495, 0.005642051808536053, 0.005830568727105856, 0.006019085645675659, 0.006207602564245462]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 2.0, 4.0, 4.0, 11.0, 7.0, 12.0, 7.0, 14.0, 18.0, 20.0, 20.0, 19.0, 28.0, 26.0, 37.0, 29.0, 44.0, 41.0, 42.0, 31.0, 44.0, 38.0, 33.0, 52.0, 24.0, 38.0, 36.0, 32.0, 31.0, 32.0, 25.0, 20.0, 26.0, 21.0, 20.0, 26.0, 16.0, 10.0, 9.0, 6.0, 10.0, 8.0, 5.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.003999910783022642, -0.0038663996383547783, -0.0037328884936869144, -0.0035993773490190506, -0.0034658662043511868, -0.003332355059683323, -0.003198843915015459, -0.003065332770347595, -0.0029318216256797314, -0.0027983104810118675, -0.0026647993363440037, -0.00253128819167614, -0.002397777047008276, -0.002264265902340412, -0.0021307547576725483, -0.0019972436130046844, -0.0018637327011674643, -0.0017302215564996004, -0.0015967104118317366, -0.0014631992671638727, -0.0013296881224960089, -0.001196176977828145, -0.001062665949575603, -0.0009291548049077392, -0.0007956436602398753, -0.0006621325155720115, -0.0005286213709041476, -0.0003951102844439447, -0.00026159913977608085, -0.000128087995108217, 5.423091351985931e-06, 0.00013893423601984978, 0.0002724453806877136, 0.00040595652535557747, 0.0005394676700234413, 0.0006729787564836442, 0.0008064899011515081, 0.0009400010458193719, 0.0010735121322795749, 0.0012070232769474387, 0.0013405344216153026, 0.0014740455662831664, 0.0016075567109510303, 0.0017410677392035723, 0.0018745788838714361, 0.0020080900285393, 0.002141601173207164, 0.0022751123178750277, 0.0024086234625428915, 0.0025421346072107553, 0.002675645751878619, 0.002809156896546483, 0.002942668041214347, 0.0030761791858822107, 0.003209690097719431, 0.0033432012423872948, 0.0034767123870551586, 0.0036102235317230225, 0.0037437346763908863, 0.00387724582105875, 0.004010756965726614, 0.004144268110394478, 0.004277779255062342, 0.0044112903997302055, 0.004544801544398069]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 8.0, 7.0, 7.0, 15.0, 10.0, 15.0, 12.0, 28.0, 35.0, 48.0, 74.0, 100.0, 130.0, 186.0, 277.0, 426.0, 619.0, 852.0, 1318.0, 2167.0, 3310.0, 5086.0, 8422.0, 13914.0, 24575.0, 45776.0, 91668.0, 195558.0, 308427.0, 169133.0, 80378.0, 40085.0, 21854.0, 12735.0, 7579.0, 4756.0, 3000.0, 1992.0, 1246.0, 889.0, 580.0, 344.0, 284.0, 178.0, 130.0, 92.0, 65.0, 44.0, 26.0, 26.0, 19.0, 15.0, 10.0, 16.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0], "bins": [-0.00281524658203125, -0.002728372812271118, -0.0026414990425109863, -0.0025546252727508545, -0.0024677515029907227, -0.002380877733230591, -0.002294003963470459, -0.002207130193710327, -0.0021202564239501953, -0.0020333826541900635, -0.0019465088844299316, -0.0018596351146697998, -0.001772761344909668, -0.0016858875751495361, -0.0015990138053894043, -0.0015121400356292725, -0.0014252662658691406, -0.0013383924961090088, -0.001251518726348877, -0.0011646449565887451, -0.0010777711868286133, -0.0009908974170684814, -0.0009040236473083496, -0.0008171498775482178, -0.0007302761077880859, -0.0006434023380279541, -0.0005565285682678223, -0.00046965479850769043, -0.0003827810287475586, -0.00029590725898742676, -0.00020903348922729492, -0.00012215971946716309, -3.528594970703125e-05, 5.1587820053100586e-05, 0.00013846158981323242, 0.00022533535957336426, 0.0003122091293334961, 0.00039908289909362793, 0.00048595666885375977, 0.0005728304386138916, 0.0006597042083740234, 0.0007465779781341553, 0.0008334517478942871, 0.0009203255176544189, 0.0010071992874145508, 0.0010940730571746826, 0.0011809468269348145, 0.0012678205966949463, 0.0013546943664550781, 0.00144156813621521, 0.0015284419059753418, 0.0016153156757354736, 0.0017021894454956055, 0.0017890632152557373, 0.0018759369850158691, 0.001962810754776001, 0.002049684524536133, 0.0021365582942962646, 0.0022234320640563965, 0.0023103058338165283, 0.00239717960357666, 0.002484053373336792, 0.002570927143096924, 0.0026578009128570557, 0.0027446746826171875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 6.0, 14.0, 7.0, 13.0, 16.0, 17.0, 14.0, 27.0, 25.0, 31.0, 40.0, 31.0, 33.0, 36.0, 45.0, 42.0, 35.0, 49.0, 44.0, 48.0, 39.0, 34.0, 43.0, 26.0, 33.0, 28.0, 28.0, 29.0, 20.0, 25.0, 22.0, 16.0, 16.0, 8.0, 10.0, 4.0, 3.0, 9.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004398345947265625, -0.004252314567565918, -0.004106283187866211, -0.003960251808166504, -0.003814220428466797, -0.00366818904876709, -0.003522157669067383, -0.0033761262893676758, -0.0032300949096679688, -0.0030840635299682617, -0.0029380321502685547, -0.0027920007705688477, -0.0026459693908691406, -0.0024999380111694336, -0.0023539066314697266, -0.0022078752517700195, -0.0020618438720703125, -0.0019158124923706055, -0.0017697811126708984, -0.0016237497329711914, -0.0014777183532714844, -0.0013316869735717773, -0.0011856555938720703, -0.0010396242141723633, -0.0008935928344726562, -0.0007475614547729492, -0.0006015300750732422, -0.00045549869537353516, -0.0003094673156738281, -0.0001634359359741211, -1.7404556274414062e-05, 0.00012862682342529297, 0.000274658203125, 0.00042068958282470703, 0.0005667209625244141, 0.0007127523422241211, 0.0008587837219238281, 0.0010048151016235352, 0.0011508464813232422, 0.0012968778610229492, 0.0014429092407226562, 0.0015889406204223633, 0.0017349720001220703, 0.0018810033798217773, 0.0020270347595214844, 0.0021730661392211914, 0.0023190975189208984, 0.0024651288986206055, 0.0026111602783203125, 0.0027571916580200195, 0.0029032230377197266, 0.0030492544174194336, 0.0031952857971191406, 0.0033413171768188477, 0.0034873485565185547, 0.0036333799362182617, 0.0037794113159179688, 0.003925442695617676, 0.004071474075317383, 0.00421750545501709, 0.004363536834716797, 0.004509568214416504, 0.004655599594116211, 0.004801630973815918, 0.004947662353515625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 7.0, 5.0, 12.0, 15.0, 15.0, 25.0, 40.0, 50.0, 76.0, 87.0, 155.0, 185.0, 244.0, 388.0, 566.0, 776.0, 1136.0, 1669.0, 2522.0, 3895.0, 6228.0, 10690.0, 20603.0, 49254.0, 152253.0, 504854.0, 182632.0, 56075.0, 23403.0, 11445.0, 6746.0, 4093.0, 2591.0, 1802.0, 1230.0, 847.0, 524.0, 416.0, 287.0, 200.0, 145.0, 102.0, 74.0, 52.0, 42.0, 32.0, 25.0, 15.0, 6.0, 3.0, 7.0, 8.0, 3.0, 0.0, 0.0, 4.0], "bins": [-0.00449371337890625, -0.004359841346740723, -0.004225969314575195, -0.004092097282409668, -0.003958225250244141, -0.0038243532180786133, -0.003690481185913086, -0.0035566091537475586, -0.0034227371215820312, -0.003288865089416504, -0.0031549930572509766, -0.0030211210250854492, -0.002887248992919922, -0.0027533769607543945, -0.002619504928588867, -0.00248563289642334, -0.0023517608642578125, -0.002217888832092285, -0.002084016799926758, -0.0019501447677612305, -0.0018162727355957031, -0.0016824007034301758, -0.0015485286712646484, -0.001414656639099121, -0.0012807846069335938, -0.0011469125747680664, -0.001013040542602539, -0.0008791685104370117, -0.0007452964782714844, -0.000611424446105957, -0.0004775524139404297, -0.00034368038177490234, -0.000209808349609375, -7.593631744384766e-05, 5.793571472167969e-05, 0.00019180774688720703, 0.0003256797790527344, 0.0004595518112182617, 0.0005934238433837891, 0.0007272958755493164, 0.0008611679077148438, 0.000995039939880371, 0.0011289119720458984, 0.0012627840042114258, 0.0013966560363769531, 0.0015305280685424805, 0.0016644001007080078, 0.0017982721328735352, 0.0019321441650390625, 0.00206601619720459, 0.002199888229370117, 0.0023337602615356445, 0.002467632293701172, 0.0026015043258666992, 0.0027353763580322266, 0.002869248390197754, 0.0030031204223632812, 0.0031369924545288086, 0.003270864486694336, 0.0034047365188598633, 0.0035386085510253906, 0.003672480583190918, 0.0038063526153564453, 0.003940224647521973, 0.0040740966796875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 3.0, 10.0, 6.0, 8.0, 11.0, 12.0, 14.0, 12.0, 11.0, 21.0, 14.0, 22.0, 17.0, 22.0, 33.0, 36.0, 37.0, 32.0, 45.0, 42.0, 32.0, 40.0, 31.0, 40.0, 43.0, 43.0, 20.0, 38.0, 37.0, 25.0, 27.0, 25.0, 24.0, 24.0, 18.0, 24.0, 15.0, 12.0, 10.0, 11.0, 13.0, 8.0, 8.0, 5.0, 8.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0025348663330078125, -0.0024514496326446533, -0.002368032932281494, -0.002284616231918335, -0.0022011995315551758, -0.0021177828311920166, -0.0020343661308288574, -0.0019509494304656982, -0.001867532730102539, -0.0017841160297393799, -0.0017006993293762207, -0.0016172826290130615, -0.0015338659286499023, -0.0014504492282867432, -0.001367032527923584, -0.0012836158275604248, -0.0012001991271972656, -0.0011167824268341064, -0.0010333657264709473, -0.0009499490261077881, -0.0008665323257446289, -0.0007831156253814697, -0.0006996989250183105, -0.0006162822246551514, -0.0005328655242919922, -0.000449448823928833, -0.00036603212356567383, -0.00028261542320251465, -0.00019919872283935547, -0.00011578202247619629, -3.236532211303711e-05, 5.105137825012207e-05, 0.00013446807861328125, 0.00021788477897644043, 0.0003013014793395996, 0.0003847181797027588, 0.00046813488006591797, 0.0005515515804290771, 0.0006349682807922363, 0.0007183849811553955, 0.0008018016815185547, 0.0008852183818817139, 0.000968635082244873, 0.0010520517826080322, 0.0011354684829711914, 0.0012188851833343506, 0.0013023018836975098, 0.001385718584060669, 0.0014691352844238281, 0.0015525519847869873, 0.0016359686851501465, 0.0017193853855133057, 0.0018028020858764648, 0.001886218786239624, 0.001969635486602783, 0.0020530521869659424, 0.0021364688873291016, 0.0022198855876922607, 0.00230330228805542, 0.002386718988418579, 0.0024701356887817383, 0.0025535523891448975, 0.0026369690895080566, 0.002720385789871216, 0.002803802490234375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 8.0, 11.0, 14.0, 11.0, 26.0, 27.0, 43.0, 53.0, 82.0, 151.0, 221.0, 331.0, 569.0, 968.0, 1707.0, 3445.0, 7819.0, 23456.0, 185666.0, 761457.0, 41410.0, 11344.0, 4515.0, 2162.0, 1139.0, 683.0, 438.0, 267.0, 181.0, 111.0, 68.0, 60.0, 36.0, 20.0, 13.0, 6.0, 7.0, 6.0, 8.0, 3.0, 3.0, 8.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007228851318359375, -0.0007017403841018677, -0.0006805956363677979, -0.000659450888633728, -0.0006383061408996582, -0.0006171613931655884, -0.0005960166454315186, -0.0005748718976974487, -0.0005537271499633789, -0.0005325824022293091, -0.0005114376544952393, -0.0004902929067611694, -0.0004691481590270996, -0.0004480034112930298, -0.00042685866355895996, -0.00040571391582489014, -0.0003845691680908203, -0.0003634244203567505, -0.00034227967262268066, -0.00032113492488861084, -0.000299990177154541, -0.0002788454294204712, -0.00025770068168640137, -0.00023655593395233154, -0.00021541118621826172, -0.0001942664384841919, -0.00017312169075012207, -0.00015197694301605225, -0.00013083219528198242, -0.0001096874475479126, -8.854269981384277e-05, -6.739795207977295e-05, -4.6253204345703125e-05, -2.51084566116333e-05, -3.9637088775634766e-06, 1.7181038856506348e-05, 3.832578659057617e-05, 5.9470534324645996e-05, 8.061528205871582e-05, 0.00010176002979278564, 0.00012290477752685547, 0.0001440495252609253, 0.00016519427299499512, 0.00018633902072906494, 0.00020748376846313477, 0.0002286285161972046, 0.0002497732639312744, 0.00027091801166534424, 0.00029206275939941406, 0.0003132075071334839, 0.0003343522548675537, 0.00035549700260162354, 0.00037664175033569336, 0.0003977864980697632, 0.000418931245803833, 0.00044007599353790283, 0.00046122074127197266, 0.0004823654890060425, 0.0005035102367401123, 0.0005246549844741821, 0.000545799732208252, 0.0005669444799423218, 0.0005880892276763916, 0.0006092339754104614, 0.0006303787231445312]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 0.0, 7.0, 13.0, 21.0, 29.0, 0.0, 33.0, 29.0, 68.0, 63.0, 0.0, 89.0, 87.0, 103.0, 111.0, 0.0, 69.0, 71.0, 54.0, 43.0, 0.0, 29.0, 32.0, 13.0, 9.0, 0.0, 9.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5022233128547668e-06, -1.4547258615493774e-06, -1.407228410243988e-06, -1.3597309589385986e-06, -1.3122335076332092e-06, -1.2647360563278198e-06, -1.2172386050224304e-06, -1.169741153717041e-06, -1.1222437024116516e-06, -1.0747462511062622e-06, -1.0272487998008728e-06, -9.797513484954834e-07, -9.32253897190094e-07, -8.847564458847046e-07, -8.372589945793152e-07, -7.897615432739258e-07, -7.422640919685364e-07, -6.94766640663147e-07, -6.472691893577576e-07, -5.997717380523682e-07, -5.522742867469788e-07, -5.047768354415894e-07, -4.5727938413619995e-07, -4.0978193283081055e-07, -3.6228448152542114e-07, -3.1478703022003174e-07, -2.6728957891464233e-07, -2.1979212760925293e-07, -1.7229467630386353e-07, -1.2479722499847412e-07, -7.729977369308472e-08, -2.9802322387695312e-08, 1.7695128917694092e-08, 6.51925802230835e-08, 1.126900315284729e-07, 1.601874828338623e-07, 2.076849341392517e-07, 2.551823854446411e-07, 3.026798367500305e-07, 3.501772880554199e-07, 3.976747393608093e-07, 4.4517219066619873e-07, 4.926696419715881e-07, 5.401670932769775e-07, 5.876645445823669e-07, 6.351619958877563e-07, 6.826594471931458e-07, 7.301568984985352e-07, 7.776543498039246e-07, 8.25151801109314e-07, 8.726492524147034e-07, 9.201467037200928e-07, 9.676441550254822e-07, 1.0151416063308716e-06, 1.062639057636261e-06, 1.1101365089416504e-06, 1.1576339602470398e-06, 1.2051314115524292e-06, 1.2526288628578186e-06, 1.300126314163208e-06, 1.3476237654685974e-06, 1.3951212167739868e-06, 1.4426186680793762e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [8.0, 5.0, 12.0, 13.0, 15.0, 26.0, 36.0, 35.0, 62.0, 61.0, 110.0, 130.0, 184.0, 215.0, 270.0, 359.0, 452.0, 591.0, 745.0, 985.0, 1399.0, 1770.0, 2499.0, 3255.0, 4845.0, 6747.0, 11060.0, 19079.0, 39595.0, 112457.0, 541012.0, 183059.0, 53249.0, 23872.0, 12698.0, 7859.0, 5334.0, 3677.0, 2655.0, 1949.0, 1436.0, 1057.0, 780.0, 658.0, 473.0, 367.0, 310.0, 237.0, 202.0, 157.0, 119.0, 92.0, 68.0, 57.0, 40.0, 34.0, 29.0, 26.0, 18.0, 8.0, 9.0, 9.0, 3.0, 3.0], "bins": [-0.0004565715789794922, -0.0004416815936565399, -0.00042679160833358765, -0.0004119016230106354, -0.0003970116376876831, -0.00038212165236473083, -0.00036723166704177856, -0.0003523416817188263, -0.000337451696395874, -0.00032256171107292175, -0.0003076717257499695, -0.0002927817404270172, -0.00027789175510406494, -0.00026300176978111267, -0.0002481117844581604, -0.00023322179913520813, -0.00021833181381225586, -0.0002034418284893036, -0.00018855184316635132, -0.00017366185784339905, -0.00015877187252044678, -0.0001438818871974945, -0.00012899190187454224, -0.00011410191655158997, -9.92119312286377e-05, -8.432194590568542e-05, -6.943196058273315e-05, -5.4541975259780884e-05, -3.965198993682861e-05, -2.4762004613876343e-05, -9.872019290924072e-06, 5.017966032028198e-06, 1.990795135498047e-05, 3.479793667793274e-05, 4.968792200088501e-05, 6.457790732383728e-05, 7.946789264678955e-05, 9.435787796974182e-05, 0.00010924786329269409, 0.00012413784861564636, 0.00013902783393859863, 0.0001539178192615509, 0.00016880780458450317, 0.00018369778990745544, 0.00019858777523040771, 0.00021347776055335999, 0.00022836774587631226, 0.00024325773119926453, 0.0002581477165222168, 0.00027303770184516907, 0.00028792768716812134, 0.0003028176724910736, 0.0003177076578140259, 0.00033259764313697815, 0.0003474876284599304, 0.0003623776137828827, 0.00037726759910583496, 0.00039215758442878723, 0.0004070475697517395, 0.00042193755507469177, 0.00043682754039764404, 0.0004517175257205963, 0.0004666075110435486, 0.00048149749636650085, 0.0004963874816894531]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 4.0, 14.0, 8.0, 5.0, 9.0, 15.0, 16.0, 27.0, 26.0, 45.0, 59.0, 59.0, 125.0, 138.0, 118.0, 68.0, 43.0, 46.0, 37.0, 26.0, 25.0, 17.0, 13.0, 9.0, 11.0, 5.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00014448165893554688, -0.00014015287160873413, -0.0001358240842819214, -0.00013149529695510864, -0.0001271665096282959, -0.00012283772230148315, -0.00011850893497467041, -0.00011418014764785767, -0.00010985136032104492, -0.00010552257299423218, -0.00010119378566741943, -9.686499834060669e-05, -9.253621101379395e-05, -8.82074236869812e-05, -8.387863636016846e-05, -7.954984903335571e-05, -7.522106170654297e-05, -7.089227437973022e-05, -6.656348705291748e-05, -6.223469972610474e-05, -5.790591239929199e-05, -5.357712507247925e-05, -4.9248337745666504e-05, -4.491955041885376e-05, -4.0590763092041016e-05, -3.626197576522827e-05, -3.193318843841553e-05, -2.7604401111602783e-05, -2.327561378479004e-05, -1.8946826457977295e-05, -1.461803913116455e-05, -1.0289251804351807e-05, -5.9604644775390625e-06, -1.6316771507263184e-06, 2.6971101760864258e-06, 7.02589750289917e-06, 1.1354684829711914e-05, 1.5683472156524658e-05, 2.0012259483337402e-05, 2.4341046810150146e-05, 2.866983413696289e-05, 3.2998621463775635e-05, 3.732740879058838e-05, 4.165619611740112e-05, 4.598498344421387e-05, 5.031377077102661e-05, 5.4642558097839355e-05, 5.89713454246521e-05, 6.330013275146484e-05, 6.762892007827759e-05, 7.195770740509033e-05, 7.628649473190308e-05, 8.061528205871582e-05, 8.494406938552856e-05, 8.927285671234131e-05, 9.360164403915405e-05, 9.79304313659668e-05, 0.00010225921869277954, 0.00010658800601959229, 0.00011091679334640503, 0.00011524558067321777, 0.00011957436800003052, 0.00012390315532684326, 0.000128231942653656, 0.00013256072998046875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 11.0, 9.0, 19.0, 17.0, 12.0, 23.0, 25.0, 26.0, 47.0, 51.0, 64.0, 67.0, 77.0, 96.0, 80.0, 70.0, 55.0, 42.0, 33.0, 33.0, 22.0, 19.0, 18.0, 12.0, 16.0, 10.0, 3.0, 6.0, 2.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.005790685303509235, -0.00561134098097682, -0.005431996658444405, -0.0052526528015732765, -0.005073308479040861, -0.004893964156508446, -0.004714620299637318, -0.004535275977104902, -0.004355931654572487, -0.0041765873320400715, -0.003997243009507656, -0.003817899152636528, -0.0036385548301041126, -0.0034592105075716972, -0.0032798664178699255, -0.0031005223281681538, -0.0029211780056357384, -0.002741833683103323, -0.0025624895934015512, -0.0023831455036997795, -0.002203801181167364, -0.0020244568586349487, -0.001845112768933177, -0.0016657685628160834, -0.0014864243566989899, -0.0013070801505818963, -0.0011277359444648027, -0.0009483917383477092, -0.0007690475322306156, -0.000589703326113522, -0.0004103591199964285, -0.00023101491387933493, -5.167117342352867e-05, 0.0001276730326935649, 0.00030701723881065845, 0.000486361444927752, 0.0006657056510448456, 0.0008450498571619391, 0.0010243940632790327, 0.0012037382693961263, 0.0013830824755132198, 0.0015624266816303134, 0.001741770887747407, 0.0019211150938645005, 0.002100459299981594, 0.0022798036225140095, 0.002459147712215781, 0.002638491801917553, 0.0028178361244499683, 0.0029971804469823837, 0.0031765245366841555, 0.003355868626385927, 0.0035352129489183426, 0.003714557271450758, 0.0038939013611525297, 0.0040732454508543015, 0.004252589773386717, 0.004431934095919132, 0.00461127795279026, 0.004790622275322676, 0.004969966597855091, 0.0051493109203875065, 0.005328655242919922, 0.00550799909979105, 0.005687343422323465]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 5.0, 4.0, 7.0, 10.0, 9.0, 11.0, 13.0, 16.0, 17.0, 24.0, 18.0, 22.0, 28.0, 38.0, 27.0, 41.0, 42.0, 44.0, 35.0, 41.0, 37.0, 32.0, 49.0, 32.0, 37.0, 31.0, 36.0, 23.0, 42.0, 26.0, 19.0, 25.0, 23.0, 22.0, 21.0, 21.0, 8.0, 12.0, 6.0, 10.0, 8.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.004079313483089209, -0.0039454260841012, -0.0038115386851131916, -0.003677651286125183, -0.003543763654306531, -0.0034098762553185225, -0.003275988856330514, -0.0031421014573425055, -0.0030082138255238533, -0.002874326426535845, -0.0027404390275478363, -0.002606551628559828, -0.0024726639967411757, -0.002338776597753167, -0.0022048891987651587, -0.00207100179977715, -0.0019371144007891417, -0.0018032270018011332, -0.0016693394863978028, -0.0015354520874097943, -0.001401564572006464, -0.0012676771730184555, -0.001133789774030447, -0.0009999023750424385, -0.0008660148596391082, -0.0007321274024434388, -0.0005982399452477694, -0.00046435254625976086, -0.00033046508906409144, -0.00019657763186842203, -6.269023288041353e-05, 7.119722431525588e-05, 0.0002050846815109253, 0.0003389721387065947, 0.00047285956679843366, 0.0006067469948902726, 0.000740634452085942, 0.0008745219092816114, 0.00100840930826962, 0.0011422967072576284, 0.0012761842226609588, 0.0014100716216489673, 0.0015439591370522976, 0.001677846536040306, 0.0018117339350283146, 0.001945621450431645, 0.0020795087330043316, 0.0022133963648229837, 0.0023472837638109922, 0.0024811711627990007, 0.0026150585617870092, 0.0027489461936056614, 0.00288283359259367, 0.0030167209915816784, 0.003150608390569687, 0.0032844957895576954, 0.003418383188545704, 0.0035522705875337124, 0.003686157986521721, 0.0038200453855097294, 0.003953932784497738, 0.004087820649147034, 0.004221707582473755, 0.004355595447123051, 0.004489482846111059]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 7.0, 9.0, 14.0, 28.0, 49.0, 74.0, 130.0, 193.0, 295.0, 483.0, 682.0, 1043.0, 1743.0, 2698.0, 4349.0, 6999.0, 11636.0, 19496.0, 33566.0, 61426.0, 121964.0, 265663.0, 257069.0, 117897.0, 59645.0, 33044.0, 18628.0, 11285.0, 6849.0, 4228.0, 2671.0, 1686.0, 1127.0, 677.0, 432.0, 281.0, 186.0, 108.0, 69.0, 39.0, 33.0, 19.0, 12.0, 14.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00958251953125, -0.009273171424865723, -0.008963823318481445, -0.008654475212097168, -0.00834512710571289, -0.008035778999328613, -0.007726430892944336, -0.007417082786560059, -0.007107734680175781, -0.006798386573791504, -0.0064890384674072266, -0.006179690361022949, -0.005870342254638672, -0.0055609941482543945, -0.005251646041870117, -0.00494229793548584, -0.0046329498291015625, -0.004323601722717285, -0.004014253616333008, -0.0037049055099487305, -0.003395557403564453, -0.0030862092971801758, -0.0027768611907958984, -0.002467513084411621, -0.0021581649780273438, -0.0018488168716430664, -0.001539468765258789, -0.0012301206588745117, -0.0009207725524902344, -0.000611424446105957, -0.0003020763397216797, 7.271766662597656e-06, 0.000316619873046875, 0.0006259679794311523, 0.0009353160858154297, 0.001244664192199707, 0.0015540122985839844, 0.0018633604049682617, 0.002172708511352539, 0.0024820566177368164, 0.0027914047241210938, 0.003100752830505371, 0.0034101009368896484, 0.0037194490432739258, 0.004028797149658203, 0.0043381452560424805, 0.004647493362426758, 0.004956841468811035, 0.0052661895751953125, 0.00557553768157959, 0.005884885787963867, 0.0061942338943481445, 0.006503582000732422, 0.006812930107116699, 0.0071222782135009766, 0.007431626319885254, 0.007740974426269531, 0.008050322532653809, 0.008359670639038086, 0.008669018745422363, 0.00897836685180664, 0.009287714958190918, 0.009597063064575195, 0.009906411170959473, 0.01021575927734375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 10.0, 9.0, 6.0, 14.0, 15.0, 15.0, 19.0, 27.0, 18.0, 19.0, 23.0, 32.0, 30.0, 41.0, 45.0, 28.0, 36.0, 40.0, 43.0, 42.0, 37.0, 41.0, 33.0, 43.0, 34.0, 25.0, 39.0, 22.0, 22.0, 26.0, 21.0, 19.0, 23.0, 18.0, 13.0, 9.0, 5.0, 8.0, 6.0, 7.0, 2.0, 5.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00362396240234375, -0.0035122036933898926, -0.003400444984436035, -0.0032886862754821777, -0.0031769275665283203, -0.003065168857574463, -0.0029534101486206055, -0.002841651439666748, -0.0027298927307128906, -0.002618134021759033, -0.0025063753128051758, -0.0023946166038513184, -0.002282857894897461, -0.0021710991859436035, -0.002059340476989746, -0.0019475817680358887, -0.0018358230590820312, -0.0017240643501281738, -0.0016123056411743164, -0.001500546932220459, -0.0013887882232666016, -0.0012770295143127441, -0.0011652708053588867, -0.0010535120964050293, -0.0009417533874511719, -0.0008299946784973145, -0.000718235969543457, -0.0006064772605895996, -0.0004947185516357422, -0.00038295984268188477, -0.00027120113372802734, -0.00015944242477416992, -4.76837158203125e-05, 6.407499313354492e-05, 0.00017583370208740234, 0.00028759241104125977, 0.0003993511199951172, 0.0005111098289489746, 0.000622868537902832, 0.0007346272468566895, 0.0008463859558105469, 0.0009581446647644043, 0.0010699033737182617, 0.0011816620826721191, 0.0012934207916259766, 0.001405179500579834, 0.0015169382095336914, 0.0016286969184875488, 0.0017404556274414062, 0.0018522143363952637, 0.001963973045349121, 0.0020757317543029785, 0.002187490463256836, 0.0022992491722106934, 0.0024110078811645508, 0.002522766590118408, 0.0026345252990722656, 0.002746284008026123, 0.0028580427169799805, 0.002969801425933838, 0.0030815601348876953, 0.0031933188438415527, 0.00330507755279541, 0.0034168362617492676, 0.003528594970703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 9.0, 14.0, 17.0, 30.0, 31.0, 55.0, 74.0, 121.0, 206.0, 271.0, 392.0, 633.0, 917.0, 1304.0, 2000.0, 3164.0, 4850.0, 7340.0, 11389.0, 18683.0, 30325.0, 51370.0, 90945.0, 166071.0, 261987.0, 168908.0, 91916.0, 52635.0, 30851.0, 18928.0, 11759.0, 7376.0, 4663.0, 3212.0, 2033.0, 1347.0, 909.0, 602.0, 432.0, 249.0, 181.0, 116.0, 69.0, 61.0, 48.0, 30.0, 17.0, 7.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00789642333984375, -0.007645845413208008, -0.007395267486572266, -0.0071446895599365234, -0.006894111633300781, -0.006643533706665039, -0.006392955780029297, -0.006142377853393555, -0.0058917999267578125, -0.00564122200012207, -0.005390644073486328, -0.005140066146850586, -0.004889488220214844, -0.0046389102935791016, -0.004388332366943359, -0.004137754440307617, -0.003887176513671875, -0.003636598587036133, -0.0033860206604003906, -0.0031354427337646484, -0.0028848648071289062, -0.002634286880493164, -0.002383708953857422, -0.0021331310272216797, -0.0018825531005859375, -0.0016319751739501953, -0.0013813972473144531, -0.001130819320678711, -0.0008802413940429688, -0.0006296634674072266, -0.0003790855407714844, -0.0001285076141357422, 0.0001220703125, 0.0003726482391357422, 0.0006232261657714844, 0.0008738040924072266, 0.0011243820190429688, 0.001374959945678711, 0.0016255378723144531, 0.0018761157989501953, 0.0021266937255859375, 0.0023772716522216797, 0.002627849578857422, 0.002878427505493164, 0.0031290054321289062, 0.0033795833587646484, 0.0036301612854003906, 0.003880739212036133, 0.004131317138671875, 0.004381895065307617, 0.004632472991943359, 0.0048830509185791016, 0.005133628845214844, 0.005384206771850586, 0.005634784698486328, 0.00588536262512207, 0.0061359405517578125, 0.006386518478393555, 0.006637096405029297, 0.006887674331665039, 0.007138252258300781, 0.0073888301849365234, 0.007639408111572266, 0.007889986038208008, 0.00814056396484375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 3.0, 3.0, 8.0, 9.0, 10.0, 11.0, 17.0, 8.0, 13.0, 19.0, 18.0, 35.0, 35.0, 31.0, 36.0, 34.0, 41.0, 38.0, 39.0, 44.0, 50.0, 44.0, 36.0, 40.0, 39.0, 36.0, 45.0, 42.0, 31.0, 32.0, 26.0, 23.0, 16.0, 7.0, 11.0, 17.0, 11.0, 12.0, 10.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025310516357421875, -0.0024531781673431396, -0.002375304698944092, -0.002297431230545044, -0.002219557762145996, -0.0021416842937469482, -0.0020638108253479004, -0.0019859373569488525, -0.0019080638885498047, -0.0018301904201507568, -0.001752316951751709, -0.0016744434833526611, -0.0015965700149536133, -0.0015186965465545654, -0.0014408230781555176, -0.0013629496097564697, -0.0012850761413574219, -0.001207202672958374, -0.0011293292045593262, -0.0010514557361602783, -0.0009735822677612305, -0.0008957087993621826, -0.0008178353309631348, -0.0007399618625640869, -0.0006620883941650391, -0.0005842149257659912, -0.0005063414573669434, -0.0004284679889678955, -0.00035059452056884766, -0.0002727210521697998, -0.00019484758377075195, -0.0001169741153717041, -3.910064697265625e-05, 3.87728214263916e-05, 0.00011664628982543945, 0.0001945197582244873, 0.00027239322662353516, 0.000350266695022583, 0.00042814016342163086, 0.0005060136318206787, 0.0005838871002197266, 0.0006617605686187744, 0.0007396340370178223, 0.0008175075054168701, 0.000895380973815918, 0.0009732544422149658, 0.0010511279106140137, 0.0011290013790130615, 0.0012068748474121094, 0.0012847483158111572, 0.001362621784210205, 0.001440495252609253, 0.0015183687210083008, 0.0015962421894073486, 0.0016741156578063965, 0.0017519891262054443, 0.0018298625946044922, 0.00190773606300354, 0.001985609531402588, 0.0020634829998016357, 0.0021413564682006836, 0.0022192299365997314, 0.0022971034049987793, 0.002374976873397827, 0.002452850341796875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 15.0, 7.0, 17.0, 21.0, 41.0, 50.0, 72.0, 111.0, 143.0, 211.0, 273.0, 400.0, 539.0, 785.0, 1057.0, 1532.0, 2192.0, 3254.0, 4853.0, 7211.0, 11365.0, 21131.0, 62095.0, 734730.0, 127217.0, 28956.0, 14058.0, 8414.0, 5555.0, 3655.0, 2511.0, 1799.0, 1215.0, 885.0, 657.0, 440.0, 293.0, 233.0, 145.0, 138.0, 82.0, 67.0, 41.0, 29.0, 20.0, 18.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004620552062988281, -0.00044699758291244507, -0.000431939959526062, -0.00041688233613967896, -0.0004018247127532959, -0.00038676708936691284, -0.0003717094659805298, -0.00035665184259414673, -0.00034159421920776367, -0.0003265365958213806, -0.00031147897243499756, -0.0002964213490486145, -0.00028136372566223145, -0.0002663061022758484, -0.00025124847888946533, -0.00023619085550308228, -0.00022113323211669922, -0.00020607560873031616, -0.0001910179853439331, -0.00017596036195755005, -0.000160902738571167, -0.00014584511518478394, -0.00013078749179840088, -0.00011572986841201782, -0.00010067224502563477, -8.561462163925171e-05, -7.055699825286865e-05, -5.5499374866485596e-05, -4.044175148010254e-05, -2.5384128093719482e-05, -1.0326504707336426e-05, 4.731118679046631e-06, 1.9788742065429688e-05, 3.4846365451812744e-05, 4.99039888381958e-05, 6.496161222457886e-05, 8.001923561096191e-05, 9.507685899734497e-05, 0.00011013448238372803, 0.00012519210577011108, 0.00014024972915649414, 0.0001553073525428772, 0.00017036497592926025, 0.0001854225993156433, 0.00020048022270202637, 0.00021553784608840942, 0.00023059546947479248, 0.00024565309286117554, 0.0002607107162475586, 0.00027576833963394165, 0.0002908259630203247, 0.00030588358640670776, 0.0003209412097930908, 0.0003359988331794739, 0.00035105645656585693, 0.00036611407995224, 0.00038117170333862305, 0.0003962293267250061, 0.00041128695011138916, 0.0004263445734977722, 0.0004414021968841553, 0.00045645982027053833, 0.0004715174436569214, 0.00048657506704330444, 0.0005016326904296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 0.0, 9.0, 0.0, 13.0, 0.0, 14.0, 0.0, 19.0, 0.0, 36.0, 0.0, 62.0, 0.0, 87.0, 0.0, 166.0, 0.0, 187.0, 0.0, 161.0, 0.0, 101.0, 0.0, 61.0, 0.0, 32.0, 0.0, 24.0, 0.0, 18.0, 0.0, 4.0, 0.0, 7.0, 0.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0728836059570312e-06, -1.043081283569336e-06, -1.0132789611816406e-06, -9.834766387939453e-07, -9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 14.0, 16.0, 23.0, 29.0, 37.0, 61.0, 70.0, 115.0, 167.0, 242.0, 341.0, 603.0, 871.0, 1388.0, 2305.0, 3939.0, 6880.0, 13007.0, 26276.0, 145350.0, 775518.0, 34611.0, 16095.0, 8511.0, 4727.0, 2745.0, 1622.0, 1003.0, 637.0, 423.0, 287.0, 196.0, 121.0, 105.0, 57.0, 45.0, 28.0, 23.0, 22.0, 10.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.00101470947265625, -0.0009874030947685242, -0.0009600967168807983, -0.0009327903389930725, -0.0009054839611053467, -0.0008781775832176208, -0.000850871205329895, -0.0008235648274421692, -0.0007962584495544434, -0.0007689520716667175, -0.0007416456937789917, -0.0007143393158912659, -0.00068703293800354, -0.0006597265601158142, -0.0006324201822280884, -0.0006051138043403625, -0.0005778074264526367, -0.0005505010485649109, -0.0005231946706771851, -0.0004958882927894592, -0.0004685819149017334, -0.00044127553701400757, -0.00041396915912628174, -0.0003866627812385559, -0.0003593564033508301, -0.00033205002546310425, -0.0003047436475753784, -0.0002774372696876526, -0.00025013089179992676, -0.00022282451391220093, -0.0001955181360244751, -0.00016821175813674927, -0.00014090538024902344, -0.00011359900236129761, -8.629262447357178e-05, -5.898624658584595e-05, -3.167986869812012e-05, -4.373490810394287e-06, 2.2932887077331543e-05, 5.023926496505737e-05, 7.75456428527832e-05, 0.00010485202074050903, 0.00013215839862823486, 0.0001594647765159607, 0.00018677115440368652, 0.00021407753229141235, 0.00024138391017913818, 0.000268690288066864, 0.00029599666595458984, 0.0003233030438423157, 0.0003506094217300415, 0.00037791579961776733, 0.00040522217750549316, 0.000432528555393219, 0.0004598349332809448, 0.00048714131116867065, 0.0005144476890563965, 0.0005417540669441223, 0.0005690604448318481, 0.000596366822719574, 0.0006236732006072998, 0.0006509795784950256, 0.0006782859563827515, 0.0007055923342704773, 0.0007328987121582031]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 6.0, 8.0, 6.0, 15.0, 9.0, 10.0, 13.0, 16.0, 55.0, 200.0, 437.0, 80.0, 32.0, 8.0, 7.0, 13.0, 8.0, 10.0, 8.0, 7.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00023818016052246094, -0.00023177079856395721, -0.0002253614366054535, -0.00021895207464694977, -0.00021254271268844604, -0.00020613335072994232, -0.0001997239887714386, -0.00019331462681293488, -0.00018690526485443115, -0.00018049590289592743, -0.0001740865409374237, -0.00016767717897891998, -0.00016126781702041626, -0.00015485845506191254, -0.0001484490931034088, -0.0001420397311449051, -0.00013563036918640137, -0.00012922100722789764, -0.00012281164526939392, -0.0001164022833108902, -0.00010999292135238647, -0.00010358355939388275, -9.717419743537903e-05, -9.07648354768753e-05, -8.435547351837158e-05, -7.794611155986786e-05, -7.153674960136414e-05, -6.512738764286041e-05, -5.871802568435669e-05, -5.2308663725852966e-05, -4.589930176734924e-05, -3.948993980884552e-05, -3.30805778503418e-05, -2.6671215891838074e-05, -2.026185393333435e-05, -1.3852491974830627e-05, -7.443130016326904e-06, -1.0337680578231812e-06, 5.375593900680542e-06, 1.1784955859184265e-05, 1.8194317817687988e-05, 2.460367977619171e-05, 3.1013041734695435e-05, 3.742240369319916e-05, 4.383176565170288e-05, 5.0241127610206604e-05, 5.665048956871033e-05, 6.305985152721405e-05, 6.946921348571777e-05, 7.58785754442215e-05, 8.228793740272522e-05, 8.869729936122894e-05, 9.510666131973267e-05, 0.00010151602327823639, 0.00010792538523674011, 0.00011433474719524384, 0.00012074410915374756, 0.00012715347111225128, 0.000133562833070755, 0.00013997219502925873, 0.00014638155698776245, 0.00015279091894626617, 0.0001592002809047699, 0.00016560964286327362, 0.00017201900482177734]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 9.0, 7.0, 11.0, 9.0, 19.0, 19.0, 22.0, 25.0, 37.0, 40.0, 48.0, 52.0, 67.0, 80.0, 89.0, 65.0, 81.0, 61.0, 41.0, 32.0, 39.0, 34.0, 23.0, 13.0, 9.0, 13.0, 6.0, 5.0, 8.0, 3.0, 3.0, 5.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004254987463355064, -0.004101085476577282, -0.003947183024138212, -0.0037932810373604298, -0.0036393788177520037, -0.0034854765981435776, -0.003331574611365795, -0.003177672391757369, -0.003023770172148943, -0.002869867952540517, -0.0027159659657627344, -0.0025620637461543083, -0.0024081615265458822, -0.002254259306937456, -0.0021003573201596737, -0.0019464551005512476, -0.0017925531137734652, -0.0016386510105803609, -0.0014847487909719348, -0.0013308466877788305, -0.0011769444681704044, -0.0010230423649773002, -0.0008691402617841959, -0.0007152380421757698, -0.0005613359389826655, -0.00040743377758190036, -0.00025353164528496563, -9.962951298803091e-05, 5.427264841273427e-05, 0.00020817480981349945, 0.0003620769130066037, 0.0005159791326150298, 0.0006698812358081341, 0.0008237833972088993, 0.0009776855586096644, 0.0011315876618027687, 0.0012854898814111948, 0.001439391984604299, 0.0015932940877974033, 0.0017471963074058294, 0.0019010984105989337, 0.002055000513792038, 0.002208902733400464, 0.00236280495300889, 0.0025167069397866726, 0.0026706091593950987, 0.0028245113790035248, 0.0029784133657813072, 0.0031323155853897333, 0.0032862178049981594, 0.003440119791775942, 0.003594022011384368, 0.003747924230992794, 0.0039018262177705765, 0.004055728204548359, 0.004209630656987429, 0.004363532643765211, 0.0045174346305429935, 0.004671337082982063, 0.004825239069759846, 0.004979141056537628, 0.005133043508976698, 0.00528694549575448, 0.00544084794819355, 0.0055947499349713326]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 5.0, 14.0, 10.0, 6.0, 17.0, 9.0, 16.0, 21.0, 26.0, 25.0, 34.0, 28.0, 30.0, 44.0, 49.0, 38.0, 43.0, 37.0, 27.0, 36.0, 38.0, 29.0, 40.0, 40.0, 39.0, 35.0, 36.0, 21.0, 20.0, 24.0, 22.0, 13.0, 18.0, 23.0, 19.0, 11.0, 13.0, 5.0, 5.0, 3.0, 6.0, 4.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003549294313415885, -0.003433592850342393, -0.003317891387268901, -0.0032021901570260525, -0.0030864886939525604, -0.0029707872308790684, -0.0028550857678055763, -0.0027393843047320843, -0.0026236828416585922, -0.0025079813785851, -0.002392279915511608, -0.002276578452438116, -0.0021608772221952677, -0.0020451757591217756, -0.0019294742960482836, -0.0018137728329747915, -0.0016980716027319431, -0.001582370139658451, -0.0014666687930002809, -0.0013509673299267888, -0.0012352659832686186, -0.0011195645201951265, -0.0010038630571216345, -0.0008881616522558033, -0.0007724602473899722, -0.0006567588425241411, -0.0005410574376583099, -0.0004253559745848179, -0.00030965456971898675, -0.0001939531648531556, -7.825170177966356e-05, 3.7449703086167574e-05, 0.00015315134078264236, 0.0002688527456484735, 0.0003845541796181351, 0.0005002556135877967, 0.0006159570184536278, 0.000731658423319459, 0.000847359886392951, 0.0009630612912587821, 0.0010787626961246133, 0.0011944641591981053, 0.0013101655058562756, 0.0014258669689297676, 0.0015415684320032597, 0.0016572697786614299, 0.001772971241734922, 0.0018886725883930922, 0.002004374051466584, 0.0021200755145400763, 0.0022357769776135683, 0.0023514782078564167, 0.0024671796709299088, 0.002582881134003401, 0.002698582597076893, 0.002814284060150385, 0.002929985523223877, 0.003045686986297369, 0.003161388449370861, 0.003277089912444353, 0.0033927911426872015, 0.0035084926057606936, 0.0036241940688341856, 0.0037398955319076777, 0.003855596762150526]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 6.0, 11.0, 5.0, 17.0, 32.0, 42.0, 52.0, 85.0, 124.0, 176.0, 268.0, 377.0, 553.0, 835.0, 1273.0, 1931.0, 3049.0, 4917.0, 8667.0, 15127.0, 28040.0, 55162.0, 120087.0, 325135.0, 1494499.0, 1542309.0, 343466.0, 125350.0, 56647.0, 28378.0, 15303.0, 8918.0, 5098.0, 2977.0, 1875.0, 1156.0, 785.0, 465.0, 352.0, 234.0, 176.0, 92.0, 82.0, 49.0, 38.0, 24.0, 13.0, 12.0, 7.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006534576416015625, -0.006323873996734619, -0.006113171577453613, -0.005902469158172607, -0.0056917667388916016, -0.005481064319610596, -0.00527036190032959, -0.005059659481048584, -0.004848957061767578, -0.004638254642486572, -0.004427552223205566, -0.0042168498039245605, -0.004006147384643555, -0.003795444965362549, -0.003584742546081543, -0.003374040126800537, -0.0031633377075195312, -0.0029526352882385254, -0.0027419328689575195, -0.0025312304496765137, -0.002320528030395508, -0.002109825611114502, -0.001899123191833496, -0.0016884207725524902, -0.0014777183532714844, -0.0012670159339904785, -0.0010563135147094727, -0.0008456110954284668, -0.0006349086761474609, -0.0004242062568664551, -0.00021350383758544922, -2.8014183044433594e-06, 0.0002079010009765625, 0.00041860342025756836, 0.0006293058395385742, 0.0008400082588195801, 0.001050710678100586, 0.0012614130973815918, 0.0014721155166625977, 0.0016828179359436035, 0.0018935203552246094, 0.0021042227745056152, 0.002314925193786621, 0.002525627613067627, 0.002736330032348633, 0.0029470324516296387, 0.0031577348709106445, 0.0033684372901916504, 0.0035791397094726562, 0.003789842128753662, 0.004000544548034668, 0.004211246967315674, 0.00442194938659668, 0.0046326518058776855, 0.004843354225158691, 0.005054056644439697, 0.005264759063720703, 0.005475461483001709, 0.005686163902282715, 0.005896866321563721, 0.0061075687408447266, 0.006318271160125732, 0.006528973579406738, 0.006739675998687744, 0.00695037841796875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 8.0, 7.0, 13.0, 14.0, 11.0, 18.0, 18.0, 24.0, 24.0, 30.0, 48.0, 36.0, 41.0, 33.0, 41.0, 45.0, 50.0, 46.0, 43.0, 40.0, 42.0, 42.0, 36.0, 43.0, 32.0, 27.0, 26.0, 17.0, 27.0, 20.0, 17.0, 13.0, 16.0, 5.0, 3.0, 8.0, 7.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00243377685546875, -0.0023565292358398438, -0.0022792816162109375, -0.0022020339965820312, -0.002124786376953125, -0.0020475387573242188, -0.0019702911376953125, -0.0018930435180664062, -0.0018157958984375, -0.0017385482788085938, -0.0016613006591796875, -0.0015840530395507812, -0.001506805419921875, -0.0014295578002929688, -0.0013523101806640625, -0.0012750625610351562, -0.00119781494140625, -0.0011205673217773438, -0.0010433197021484375, -0.0009660720825195312, -0.000888824462890625, -0.0008115768432617188, -0.0007343292236328125, -0.0006570816040039062, -0.000579833984375, -0.0005025863647460938, -0.0004253387451171875, -0.00034809112548828125, -0.000270843505859375, -0.00019359588623046875, -0.0001163482666015625, -3.910064697265625e-05, 3.814697265625e-05, 0.00011539459228515625, 0.0001926422119140625, 0.00026988983154296875, 0.000347137451171875, 0.00042438507080078125, 0.0005016326904296875, 0.0005788803100585938, 0.0006561279296875, 0.0007333755493164062, 0.0008106231689453125, 0.0008878707885742188, 0.000965118408203125, 0.0010423660278320312, 0.0011196136474609375, 0.0011968612670898438, 0.00127410888671875, 0.0013513565063476562, 0.0014286041259765625, 0.0015058517456054688, 0.001583099365234375, 0.0016603469848632812, 0.0017375946044921875, 0.0018148422241210938, 0.00189208984375, 0.0019693374633789062, 0.0020465850830078125, 0.0021238327026367188, 0.002201080322265625, 0.0022783279418945312, 0.0023555755615234375, 0.0024328231811523438, 0.00251007080078125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 9.0, 9.0, 15.0, 21.0, 22.0, 30.0, 55.0, 91.0, 118.0, 157.0, 254.0, 385.0, 530.0, 764.0, 1187.0, 1782.0, 2689.0, 4277.0, 6895.0, 11214.0, 19817.0, 36826.0, 72971.0, 161063.0, 406311.0, 1236886.0, 1411783.0, 464524.0, 179329.0, 80353.0, 39894.0, 21335.0, 12008.0, 7435.0, 4612.0, 2932.0, 1948.0, 1169.0, 843.0, 553.0, 342.0, 261.0, 187.0, 135.0, 81.0, 54.0, 43.0, 28.0, 14.0, 16.0, 11.0, 7.0, 9.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0046844482421875, -0.004533648490905762, -0.0043828487396240234, -0.004232048988342285, -0.004081249237060547, -0.003930449485778809, -0.0037796497344970703, -0.003628849983215332, -0.0034780502319335938, -0.0033272504806518555, -0.003176450729370117, -0.003025650978088379, -0.0028748512268066406, -0.0027240514755249023, -0.002573251724243164, -0.0024224519729614258, -0.0022716522216796875, -0.0021208524703979492, -0.001970052719116211, -0.0018192529678344727, -0.0016684532165527344, -0.001517653465270996, -0.0013668537139892578, -0.0012160539627075195, -0.0010652542114257812, -0.000914454460144043, -0.0007636547088623047, -0.0006128549575805664, -0.0004620552062988281, -0.00031125545501708984, -0.00016045570373535156, -9.655952453613281e-06, 0.000141143798828125, 0.0002919435501098633, 0.00044274330139160156, 0.0005935430526733398, 0.0007443428039550781, 0.0008951425552368164, 0.0010459423065185547, 0.001196742057800293, 0.0013475418090820312, 0.0014983415603637695, 0.0016491413116455078, 0.001799941062927246, 0.0019507408142089844, 0.0021015405654907227, 0.002252340316772461, 0.0024031400680541992, 0.0025539398193359375, 0.0027047395706176758, 0.002855539321899414, 0.0030063390731811523, 0.0031571388244628906, 0.003307938575744629, 0.003458738327026367, 0.0036095380783081055, 0.0037603378295898438, 0.003911137580871582, 0.00406193733215332, 0.004212737083435059, 0.004363536834716797, 0.004514336585998535, 0.0046651363372802734, 0.004815936088562012, 0.00496673583984375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 4.0, 7.0, 11.0, 10.0, 14.0, 11.0, 15.0, 14.0, 15.0, 33.0, 24.0, 39.0, 62.0, 71.0, 85.0, 115.0, 127.0, 135.0, 194.0, 239.0, 302.0, 320.0, 334.0, 306.0, 262.0, 218.0, 197.0, 170.0, 134.0, 98.0, 96.0, 73.0, 67.0, 58.0, 51.0, 27.0, 19.0, 22.0, 19.0, 17.0, 11.0, 10.0, 9.0, 5.0, 6.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00130462646484375, -0.0012645721435546875, -0.001224517822265625, -0.0011844635009765625, -0.0011444091796875, -0.0011043548583984375, -0.001064300537109375, -0.0010242462158203125, -0.00098419189453125, -0.0009441375732421875, -0.000904083251953125, -0.0008640289306640625, -0.000823974609375, -0.0007839202880859375, -0.000743865966796875, -0.0007038116455078125, -0.00066375732421875, -0.0006237030029296875, -0.000583648681640625, -0.0005435943603515625, -0.0005035400390625, -0.0004634857177734375, -0.000423431396484375, -0.0003833770751953125, -0.00034332275390625, -0.0003032684326171875, -0.000263214111328125, -0.0002231597900390625, -0.00018310546875, -0.0001430511474609375, -0.000102996826171875, -6.29425048828125e-05, -2.288818359375e-05, 1.71661376953125e-05, 5.7220458984375e-05, 9.72747802734375e-05, 0.0001373291015625, 0.0001773834228515625, 0.000217437744140625, 0.0002574920654296875, 0.00029754638671875, 0.0003376007080078125, 0.000377655029296875, 0.0004177093505859375, 0.000457763671875, 0.0004978179931640625, 0.000537872314453125, 0.0005779266357421875, 0.00061798095703125, 0.0006580352783203125, 0.000698089599609375, 0.0007381439208984375, 0.0007781982421875, 0.0008182525634765625, 0.000858306884765625, 0.0008983612060546875, 0.00093841552734375, 0.0009784698486328125, 0.001018524169921875, 0.0010585784912109375, 0.0010986328125, 0.0011386871337890625, 0.001178741455078125, 0.0012187957763671875, 0.00125885009765625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 4.0, 9.0, 7.0, 11.0, 11.0, 17.0, 19.0, 23.0, 28.0, 38.0, 54.0, 57.0, 66.0, 82.0, 85.0, 87.0, 70.0, 62.0, 52.0, 40.0, 38.0, 27.0, 22.0, 10.0, 12.0, 12.0, 5.0, 8.0, 3.0, 6.0, 7.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026902512181550264, -0.002582498360425234, -0.0024747455026954412, -0.0023669926449656487, -0.002259239787235856, -0.0021514869295060635, -0.0020437343046069145, -0.0019359813304618, -0.0018282284727320075, -0.001720475615002215, -0.0016127227572724223, -0.0015049700159579515, -0.001397217158228159, -0.0012894643004983664, -0.0011817114427685738, -0.0010739585850387812, -0.0009662057273089886, -0.000858452869579196, -0.0007507000118494034, -0.0006429472123272717, -0.0005351943545974791, -0.0004274414968676865, -0.00031968869734555483, -0.00021193583961576223, -0.00010418298188596964, 3.5698612919077277e-06, 0.0001113227044697851, 0.00021907553309574723, 0.00032682839082553983, 0.0004345812485553324, 0.0005423340480774641, 0.0006500869058072567, 0.000757839996367693, 0.0008655928540974855, 0.0009733457118272781, 0.0010810985695570707, 0.0011888514272868633, 0.001296604285016656, 0.0014043570263311267, 0.0015121098840609193, 0.0016198627417907119, 0.0017276155995205045, 0.001835368457250297, 0.0019431211985647678, 0.0020508740562945604, 0.002158626914024353, 0.0022663797717541456, 0.0023741326294839382, 0.002481885487213731, 0.0025896383449435234, 0.002697391202673316, 0.0028051440604031086, 0.002912896918132901, 0.003020649775862694, 0.0031284024007618427, 0.003236155491322279, 0.003343908116221428, 0.0034516609739512205, 0.003559413831681013, 0.0036671666894108057, 0.0037749195471405983, 0.003882672404870391, 0.0039904252626001835, 0.004098177887499332, 0.004205930978059769]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 1.0, 7.0, 5.0, 2.0, 5.0, 10.0, 10.0, 9.0, 10.0, 14.0, 14.0, 13.0, 21.0, 32.0, 35.0, 24.0, 41.0, 36.0, 44.0, 32.0, 29.0, 36.0, 47.0, 39.0, 53.0, 38.0, 30.0, 36.0, 38.0, 43.0, 43.0, 28.0, 19.0, 23.0, 25.0, 25.0, 12.0, 10.0, 7.0, 12.0, 12.0, 8.0, 9.0, 4.0, 5.0, 3.0, 0.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002179201925173402, -0.0021003512665629387, -0.0020215006079524755, -0.0019426500657573342, -0.001863799407146871, -0.001784948748536408, -0.0017060982063412666, -0.0016272475477308035, -0.0015483968891203403, -0.0014695462305098772, -0.001390695571899414, -0.0013118450297042727, -0.0012329943710938096, -0.0011541437124833465, -0.0010752931702882051, -0.000996442511677742, -0.0009175918530672789, -0.0008387411944568157, -0.0007598905940540135, -0.0006810399936512113, -0.0006021893350407481, -0.000523338676430285, -0.00044448807602748275, -0.0003656374756246805, -0.0002867868170142174, -0.0002079361875075847, -0.000129085558000952, -5.023492849431932e-05, 2.8615701012313366e-05, 0.00010746633051894605, 0.00018631696002557874, 0.00026516756042838097, 0.00034401845186948776, 0.00042286908137612045, 0.0005017197108827531, 0.0005805703112855554, 0.0006594209698960185, 0.0007382716285064816, 0.0008171222289092839, 0.0008959728293120861, 0.0009748234879225492, 0.0010536741465330124, 0.0011325248051434755, 0.0012113753473386168, 0.00129022600594908, 0.0013690766645595431, 0.0014479272067546844, 0.0015267778653651476, 0.0016056285239756107, 0.0016844791825860739, 0.001763329841196537, 0.0018421803833916783, 0.0019210310420021415, 0.001999881584197283, 0.002078732242807746, 0.002157582901418209, 0.0022364335600286722, 0.0023152842186391354, 0.0023941348772495985, 0.0024729855358600616, 0.002551835961639881, 0.0026306866202503443, 0.0027095372788608074, 0.0027883879374712706, 0.0028672385960817337]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 3.0, 13.0, 15.0, 21.0, 35.0, 47.0, 73.0, 121.0, 190.0, 280.0, 490.0, 815.0, 1570.0, 3258.0, 7885.0, 20963.0, 64962.0, 248722.0, 495588.0, 139343.0, 39669.0, 13657.0, 5513.0, 2410.0, 1199.0, 670.0, 386.0, 233.0, 156.0, 81.0, 60.0, 35.0, 30.0, 16.0, 13.0, 11.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00211334228515625, -0.0020359158515930176, -0.001958489418029785, -0.0018810629844665527, -0.0018036365509033203, -0.0017262101173400879, -0.0016487836837768555, -0.001571357250213623, -0.0014939308166503906, -0.0014165043830871582, -0.0013390779495239258, -0.0012616515159606934, -0.001184225082397461, -0.0011067986488342285, -0.001029372215270996, -0.0009519457817077637, -0.0008745193481445312, -0.0007970929145812988, -0.0007196664810180664, -0.000642240047454834, -0.0005648136138916016, -0.00048738718032836914, -0.0004099607467651367, -0.0003325343132019043, -0.0002551078796386719, -0.00017768144607543945, -0.00010025501251220703, -2.282857894897461e-05, 5.459785461425781e-05, 0.00013202428817749023, 0.00020945072174072266, 0.0002868771553039551, 0.0003643035888671875, 0.0004417300224304199, 0.0005191564559936523, 0.0005965828895568848, 0.0006740093231201172, 0.0007514357566833496, 0.000828862190246582, 0.0009062886238098145, 0.0009837150573730469, 0.0010611414909362793, 0.0011385679244995117, 0.0012159943580627441, 0.0012934207916259766, 0.001370847225189209, 0.0014482736587524414, 0.0015257000923156738, 0.0016031265258789062, 0.0016805529594421387, 0.001757979393005371, 0.0018354058265686035, 0.001912832260131836, 0.0019902586936950684, 0.0020676851272583008, 0.002145111560821533, 0.0022225379943847656, 0.002299964427947998, 0.0023773908615112305, 0.002454817295074463, 0.0025322437286376953, 0.0026096701622009277, 0.00268709659576416, 0.0027645230293273926, 0.002841949462890625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 7.0, 5.0, 11.0, 10.0, 5.0, 20.0, 13.0, 10.0, 24.0, 23.0, 20.0, 30.0, 34.0, 40.0, 40.0, 34.0, 39.0, 35.0, 49.0, 47.0, 43.0, 39.0, 43.0, 33.0, 28.0, 45.0, 37.0, 38.0, 34.0, 28.0, 20.0, 19.0, 16.0, 12.0, 10.0, 3.0, 8.0, 8.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0023517608642578125, -0.002268075942993164, -0.0021843910217285156, -0.002100706100463867, -0.0020170211791992188, -0.0019333362579345703, -0.0018496513366699219, -0.0017659664154052734, -0.001682281494140625, -0.0015985965728759766, -0.0015149116516113281, -0.0014312267303466797, -0.0013475418090820312, -0.0012638568878173828, -0.0011801719665527344, -0.001096487045288086, -0.0010128021240234375, -0.0009291172027587891, -0.0008454322814941406, -0.0007617473602294922, -0.0006780624389648438, -0.0005943775177001953, -0.0005106925964355469, -0.00042700767517089844, -0.00034332275390625, -0.00025963783264160156, -0.00017595291137695312, -9.226799011230469e-05, -8.58306884765625e-06, 7.510185241699219e-05, 0.00015878677368164062, 0.00024247169494628906, 0.0003261566162109375, 0.00040984153747558594, 0.0004935264587402344, 0.0005772113800048828, 0.0006608963012695312, 0.0007445812225341797, 0.0008282661437988281, 0.0009119510650634766, 0.000995635986328125, 0.0010793209075927734, 0.0011630058288574219, 0.0012466907501220703, 0.0013303756713867188, 0.0014140605926513672, 0.0014977455139160156, 0.001581430435180664, 0.0016651153564453125, 0.001748800277709961, 0.0018324851989746094, 0.0019161701202392578, 0.0019998550415039062, 0.0020835399627685547, 0.002167224884033203, 0.0022509098052978516, 0.0023345947265625, 0.0024182796478271484, 0.002501964569091797, 0.0025856494903564453, 0.0026693344116210938, 0.002753019332885742, 0.0028367042541503906, 0.002920389175415039, 0.0030040740966796875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 9.0, 8.0, 16.0, 26.0, 30.0, 32.0, 75.0, 87.0, 122.0, 205.0, 286.0, 350.0, 494.0, 758.0, 1265.0, 2095.0, 3753.0, 7643.0, 16658.0, 45924.0, 178215.0, 565346.0, 152128.0, 41438.0, 15363.0, 6932.0, 3592.0, 2122.0, 1227.0, 763.0, 476.0, 345.0, 223.0, 135.0, 117.0, 75.0, 56.0, 36.0, 29.0, 26.0, 23.0, 15.0, 13.0, 8.0, 1.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.002529144287109375, -0.002453535795211792, -0.002377927303314209, -0.002302318811416626, -0.002226710319519043, -0.00215110182762146, -0.002075493335723877, -0.001999884843826294, -0.001924276351928711, -0.001848667860031128, -0.001773059368133545, -0.001697450876235962, -0.001621842384338379, -0.001546233892440796, -0.0014706254005432129, -0.0013950169086456299, -0.0013194084167480469, -0.0012437999248504639, -0.0011681914329528809, -0.0010925829410552979, -0.0010169744491577148, -0.0009413659572601318, -0.0008657574653625488, -0.0007901489734649658, -0.0007145404815673828, -0.0006389319896697998, -0.0005633234977722168, -0.0004877150058746338, -0.0004121065139770508, -0.0003364980220794678, -0.00026088953018188477, -0.00018528103828430176, -0.00010967254638671875, -3.406405448913574e-05, 4.1544437408447266e-05, 0.00011715292930603027, 0.00019276142120361328, 0.0002683699131011963, 0.0003439784049987793, 0.0004195868968963623, 0.0004951953887939453, 0.0005708038806915283, 0.0006464123725891113, 0.0007220208644866943, 0.0007976293563842773, 0.0008732378482818604, 0.0009488463401794434, 0.0010244548320770264, 0.0011000633239746094, 0.0011756718158721924, 0.0012512803077697754, 0.0013268887996673584, 0.0014024972915649414, 0.0014781057834625244, 0.0015537142753601074, 0.0016293227672576904, 0.0017049312591552734, 0.0017805397510528564, 0.0018561482429504395, 0.0019317567348480225, 0.0020073652267456055, 0.0020829737186431885, 0.0021585822105407715, 0.0022341907024383545, 0.0023097991943359375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 7.0, 6.0, 1.0, 10.0, 7.0, 8.0, 13.0, 16.0, 11.0, 24.0, 23.0, 29.0, 25.0, 27.0, 39.0, 28.0, 41.0, 33.0, 40.0, 42.0, 30.0, 49.0, 40.0, 41.0, 34.0, 37.0, 40.0, 30.0, 28.0, 26.0, 32.0, 31.0, 27.0, 23.0, 19.0, 17.0, 19.0, 7.0, 9.0, 7.0, 6.0, 7.0, 8.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0016803741455078125, -0.0016296952962875366, -0.0015790164470672607, -0.0015283375978469849, -0.001477658748626709, -0.001426979899406433, -0.0013763010501861572, -0.0013256222009658813, -0.0012749433517456055, -0.0012242645025253296, -0.0011735856533050537, -0.0011229068040847778, -0.001072227954864502, -0.001021549105644226, -0.0009708702564239502, -0.0009201914072036743, -0.0008695125579833984, -0.0008188337087631226, -0.0007681548595428467, -0.0007174760103225708, -0.0006667971611022949, -0.000616118311882019, -0.0005654394626617432, -0.0005147606134414673, -0.0004640817642211914, -0.00041340291500091553, -0.00036272406578063965, -0.00031204521656036377, -0.0002613663673400879, -0.000210687518119812, -0.00016000866889953613, -0.00010932981967926025, -5.8650970458984375e-05, -7.972121238708496e-06, 4.270672798156738e-05, 9.338557720184326e-05, 0.00014406442642211914, 0.00019474327564239502, 0.0002454221248626709, 0.0002961009740829468, 0.00034677982330322266, 0.00039745867252349854, 0.0004481375217437744, 0.0004988163709640503, 0.0005494952201843262, 0.000600174069404602, 0.0006508529186248779, 0.0007015317678451538, 0.0007522106170654297, 0.0008028894662857056, 0.0008535683155059814, 0.0009042471647262573, 0.0009549260139465332, 0.001005604863166809, 0.001056283712387085, 0.0011069625616073608, 0.0011576414108276367, 0.0012083202600479126, 0.0012589991092681885, 0.0013096779584884644, 0.0013603568077087402, 0.0014110356569290161, 0.001461714506149292, 0.0015123933553695679, 0.0015630722045898438]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 10.0, 7.0, 10.0, 15.0, 19.0, 25.0, 32.0, 50.0, 67.0, 89.0, 126.0, 152.0, 249.0, 283.0, 407.0, 563.0, 789.0, 1162.0, 1787.0, 2654.0, 4232.0, 7491.0, 14474.0, 32064.0, 100057.0, 627274.0, 170185.0, 42982.0, 17759.0, 8997.0, 5001.0, 3028.0, 1975.0, 1305.0, 883.0, 604.0, 439.0, 352.0, 253.0, 187.0, 133.0, 113.0, 68.0, 62.0, 47.0, 27.0, 21.0, 18.0, 11.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0001627206802368164, -0.00015757977962493896, -0.00015243887901306152, -0.00014729797840118408, -0.00014215707778930664, -0.0001370161771774292, -0.00013187527656555176, -0.00012673437595367432, -0.00012159347534179688, -0.00011645257472991943, -0.00011131167411804199, -0.00010617077350616455, -0.00010102987289428711, -9.588897228240967e-05, -9.074807167053223e-05, -8.560717105865479e-05, -8.046627044677734e-05, -7.53253698348999e-05, -7.018446922302246e-05, -6.504356861114502e-05, -5.990266799926758e-05, -5.476176738739014e-05, -4.9620866775512695e-05, -4.4479966163635254e-05, -3.933906555175781e-05, -3.419816493988037e-05, -2.905726432800293e-05, -2.3916363716125488e-05, -1.8775463104248047e-05, -1.3634562492370605e-05, -8.493661880493164e-06, -3.3527612686157227e-06, 1.7881393432617188e-06, 6.92903995513916e-06, 1.2069940567016602e-05, 1.7210841178894043e-05, 2.2351741790771484e-05, 2.7492642402648926e-05, 3.263354301452637e-05, 3.777444362640381e-05, 4.291534423828125e-05, 4.805624485015869e-05, 5.319714546203613e-05, 5.8338046073913574e-05, 6.347894668579102e-05, 6.861984729766846e-05, 7.37607479095459e-05, 7.890164852142334e-05, 8.404254913330078e-05, 8.918344974517822e-05, 9.432435035705566e-05, 9.94652509689331e-05, 0.00010460615158081055, 0.00010974705219268799, 0.00011488795280456543, 0.00012002885341644287, 0.0001251697540283203, 0.00013031065464019775, 0.0001354515552520752, 0.00014059245586395264, 0.00014573335647583008, 0.00015087425708770752, 0.00015601515769958496, 0.0001611560583114624, 0.00016629695892333984]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 8.0, 11.0, 0.0, 13.0, 0.0, 15.0, 0.0, 24.0, 0.0, 39.0, 0.0, 55.0, 51.0, 0.0, 70.0, 0.0, 90.0, 0.0, 88.0, 0.0, 93.0, 0.0, 77.0, 72.0, 0.0, 82.0, 0.0, 50.0, 0.0, 49.0, 0.0, 34.0, 0.0, 26.0, 16.0, 0.0, 15.0, 0.0, 8.0, 0.0, 6.0, 0.0, 6.0, 0.0, 3.0, 3.0, 0.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.210780262947083e-07, -8.884817361831665e-07, -8.558854460716248e-07, -8.23289155960083e-07, -7.906928658485413e-07, -7.580965757369995e-07, -7.255002856254578e-07, -6.92903995513916e-07, -6.603077054023743e-07, -6.277114152908325e-07, -5.951151251792908e-07, -5.62518835067749e-07, -5.299225449562073e-07, -4.973262548446655e-07, -4.647299647331238e-07, -4.3213367462158203e-07, -3.995373845100403e-07, -3.6694109439849854e-07, -3.343448042869568e-07, -3.0174851417541504e-07, -2.691522240638733e-07, -2.3655593395233154e-07, -2.039596438407898e-07, -1.7136335372924805e-07, -1.387670636177063e-07, -1.0617077350616455e-07, -7.35744833946228e-08, -4.0978193283081055e-08, -8.381903171539307e-09, 2.421438694000244e-08, 5.681067705154419e-08, 8.940696716308594e-08, 1.2200325727462769e-07, 1.5459954738616943e-07, 1.8719583749771118e-07, 2.1979212760925293e-07, 2.523884177207947e-07, 2.849847078323364e-07, 3.175809979438782e-07, 3.501772880554199e-07, 3.8277357816696167e-07, 4.153698682785034e-07, 4.4796615839004517e-07, 4.805624485015869e-07, 5.131587386131287e-07, 5.457550287246704e-07, 5.783513188362122e-07, 6.109476089477539e-07, 6.435438990592957e-07, 6.761401891708374e-07, 7.087364792823792e-07, 7.413327693939209e-07, 7.739290595054626e-07, 8.065253496170044e-07, 8.391216397285461e-07, 8.717179298400879e-07, 9.043142199516296e-07, 9.369105100631714e-07, 9.695068001747131e-07, 1.0021030902862549e-06, 1.0346993803977966e-06, 1.0672956705093384e-06, 1.0998919606208801e-06, 1.1324882507324219e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 13.0, 12.0, 15.0, 27.0, 22.0, 39.0, 65.0, 82.0, 117.0, 159.0, 265.0, 357.0, 520.0, 844.0, 1208.0, 1904.0, 2924.0, 4844.0, 8074.0, 14721.0, 28952.0, 63089.0, 183158.0, 492334.0, 136199.0, 52351.0, 24474.0, 12576.0, 7144.0, 4270.0, 2589.0, 1717.0, 1092.0, 769.0, 494.0, 352.0, 238.0, 170.0, 118.0, 66.0, 55.0, 43.0, 21.0, 25.0, 13.0, 10.0, 11.0, 2.0, 2.0, 1.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.0003018379211425781, -0.0002925172448158264, -0.0002831965684890747, -0.000273875892162323, -0.0002645552158355713, -0.0002552345395088196, -0.00024591386318206787, -0.00023659318685531616, -0.00022727251052856445, -0.00021795183420181274, -0.00020863115787506104, -0.00019931048154830933, -0.00018998980522155762, -0.0001806691288948059, -0.0001713484525680542, -0.0001620277762413025, -0.00015270709991455078, -0.00014338642358779907, -0.00013406574726104736, -0.00012474507093429565, -0.00011542439460754395, -0.00010610371828079224, -9.678304195404053e-05, -8.746236562728882e-05, -7.814168930053711e-05, -6.88210129737854e-05, -5.950033664703369e-05, -5.017966032028198e-05, -4.0858983993530273e-05, -3.1538307666778564e-05, -2.2217631340026855e-05, -1.2896955013275146e-05, -3.5762786865234375e-06, 5.7443976402282715e-06, 1.506507396697998e-05, 2.438575029373169e-05, 3.37064266204834e-05, 4.302710294723511e-05, 5.2347779273986816e-05, 6.166845560073853e-05, 7.098913192749023e-05, 8.030980825424194e-05, 8.963048458099365e-05, 9.895116090774536e-05, 0.00010827183723449707, 0.00011759251356124878, 0.0001269131898880005, 0.0001362338662147522, 0.0001455545425415039, 0.00015487521886825562, 0.00016419589519500732, 0.00017351657152175903, 0.00018283724784851074, 0.00019215792417526245, 0.00020147860050201416, 0.00021079927682876587, 0.00022011995315551758, 0.0002294406294822693, 0.000238761305809021, 0.0002480819821357727, 0.0002574026584625244, 0.0002667233347892761, 0.00027604401111602783, 0.00028536468744277954, 0.00029468536376953125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 2.0, 6.0, 12.0, 5.0, 6.0, 9.0, 13.0, 7.0, 12.0, 12.0, 24.0, 14.0, 20.0, 30.0, 60.0, 76.0, 86.0, 87.0, 108.0, 94.0, 73.0, 36.0, 31.0, 24.0, 18.0, 21.0, 13.0, 16.0, 12.0, 6.0, 7.0, 9.0, 8.0, 4.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.821487426757812e-05, -8.553359657526016e-05, -8.28523188829422e-05, -8.017104119062424e-05, -7.748976349830627e-05, -7.480848580598831e-05, -7.212720811367035e-05, -6.944593042135239e-05, -6.676465272903442e-05, -6.408337503671646e-05, -6.14020973443985e-05, -5.8720819652080536e-05, -5.603954195976257e-05, -5.335826426744461e-05, -5.067698657512665e-05, -4.7995708882808685e-05, -4.531443119049072e-05, -4.263315349817276e-05, -3.99518758058548e-05, -3.7270598113536835e-05, -3.458932042121887e-05, -3.190804272890091e-05, -2.9226765036582947e-05, -2.6545487344264984e-05, -2.386420965194702e-05, -2.118293195962906e-05, -1.8501654267311096e-05, -1.5820376574993134e-05, -1.3139098882675171e-05, -1.0457821190357208e-05, -7.776543498039246e-06, -5.095265805721283e-06, -2.4139881134033203e-06, 2.6728957891464233e-07, 2.948567271232605e-06, 5.629844963550568e-06, 8.31112265586853e-06, 1.0992400348186493e-05, 1.3673678040504456e-05, 1.6354955732822418e-05, 1.903623342514038e-05, 2.1717511117458344e-05, 2.4398788809776306e-05, 2.708006650209427e-05, 2.976134419441223e-05, 3.2442621886730194e-05, 3.512389957904816e-05, 3.780517727136612e-05, 4.048645496368408e-05, 4.3167732656002045e-05, 4.584901034832001e-05, 4.853028804063797e-05, 5.121156573295593e-05, 5.3892843425273895e-05, 5.657412111759186e-05, 5.925539880990982e-05, 6.193667650222778e-05, 6.461795419454575e-05, 6.729923188686371e-05, 6.998050957918167e-05, 7.266178727149963e-05, 7.53430649638176e-05, 7.802434265613556e-05, 8.070562034845352e-05, 8.338689804077148e-05]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 9.0, 13.0, 11.0, 14.0, 11.0, 34.0, 30.0, 36.0, 51.0, 60.0, 81.0, 82.0, 89.0, 91.0, 65.0, 56.0, 54.0, 34.0, 45.0, 22.0, 14.0, 17.0, 9.0, 9.0, 9.0, 2.0, 2.0, 8.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028534336015582085, -0.0027424762956798077, -0.002631518989801407, -0.002520561683923006, -0.0024096043780446053, -0.0022986470721662045, -0.0021876897662878036, -0.002076732460409403, -0.001965775154531002, -0.0018548178486526012, -0.0017438605427742004, -0.0016329032368957996, -0.0015219459310173988, -0.001410988625138998, -0.0013000312028452754, -0.0011890738969668746, -0.001078116474673152, -0.0009671591687947512, -0.0008562018629163504, -0.0007452444988302886, -0.0006342871929518878, -0.000523329887073487, -0.00041237252298742533, -0.0003014152171090245, -0.00019045791123062372, -7.950059080030769e-05, 3.145672963000834e-05, 0.0001424140646122396, 0.0002533713704906404, 0.0003643286763690412, 0.0004752860404551029, 0.0005862433463335037, 0.0006972006522119045, 0.0008081579580903053, 0.0009191152639687061, 0.001030072569847107, 0.0011410298757255077, 0.0012519871816039085, 0.0013629446038976312, 0.001473901909776032, 0.0015848592156544328, 0.0016958165215328336, 0.0018067738274112344, 0.001917731249704957, 0.002028688555583358, 0.0021396458614617586, 0.0022506031673401594, 0.0023615604732185602, 0.002472517779096961, 0.002583475084975362, 0.0026944323908537626, 0.0028053896967321634, 0.0029163470026105642, 0.003027304308488965, 0.0031382618471980095, 0.0032492191530764103, 0.003360176458954811, 0.003471133764833212, 0.0035820910707116127, 0.0036930483765900135, 0.0038040056824684143, 0.003914962988346815, 0.004025920294225216, 0.004136877600103617, 0.0042478349059820175]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 4.0, 5.0, 10.0, 11.0, 9.0, 11.0, 14.0, 15.0, 11.0, 26.0, 30.0, 35.0, 27.0, 33.0, 47.0, 37.0, 36.0, 29.0, 42.0, 40.0, 41.0, 51.0, 34.0, 32.0, 35.0, 42.0, 51.0, 30.0, 30.0, 20.0, 24.0, 23.0, 26.0, 9.0, 9.0, 8.0, 10.0, 11.0, 11.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0021752940956503153, -0.0020960771944373846, -0.0020168600603938103, -0.0019376431591808796, -0.001858426141552627, -0.0017792091239243746, -0.001699992222711444, -0.0016207752050831914, -0.0015415581874549389, -0.0014623411698266864, -0.0013831241521984339, -0.0013039072509855032, -0.0012246902333572507, -0.0011454732157289982, -0.0010662563145160675, -0.000987039296887815, -0.0009078222792595625, -0.00082860526163131, -0.0007493883022107184, -0.0006701713427901268, -0.0005909543251618743, -0.0005117373075336218, -0.0004325203481130302, -0.0003533033886924386, -0.0002740863710641861, -0.00019486938253976405, -0.000115652394015342, -3.643540549091995e-05, 4.27815830335021e-05, 0.00012199857155792415, 0.0002012155600823462, 0.0002804325195029378, 0.00035964976996183395, 0.000438866758486256, 0.000518083747010678, 0.0005973007064312696, 0.0006765177240595222, 0.0007557347416877747, 0.0008349517011083663, 0.0009141686605289578, 0.0009933856781572104, 0.0010726026957854629, 0.0011518197134137154, 0.001231036614626646, 0.0013102536322548985, 0.001389470649883151, 0.0014686875510960817, 0.0015479045687243342, 0.0016271215863525867, 0.0017063386039808393, 0.0017855556216090918, 0.0018647725228220224, 0.001943989540450275, 0.0020232065580785275, 0.002102423459291458, 0.002181640360504389, 0.002260857494547963, 0.002340074395760894, 0.002419291529804468, 0.002498508431017399, 0.0025777253322303295, 0.002656942466273904, 0.0027361593674868345, 0.002815376501530409, 0.0028945934027433395]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 3.0, 6.0, 4.0, 7.0, 7.0, 17.0, 28.0, 46.0, 45.0, 68.0, 117.0, 160.0, 251.0, 345.0, 494.0, 762.0, 1216.0, 1805.0, 2750.0, 4271.0, 6976.0, 11281.0, 19293.0, 32798.0, 60729.0, 120494.0, 232485.0, 253402.0, 138062.0, 69147.0, 36961.0, 20982.0, 12483.0, 7487.0, 4675.0, 3011.0, 1932.0, 1294.0, 862.0, 584.0, 405.0, 249.0, 177.0, 128.0, 68.0, 69.0, 37.0, 24.0, 27.0, 12.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.00601959228515625, -0.005843043327331543, -0.005666494369506836, -0.005489945411682129, -0.005313396453857422, -0.005136847496032715, -0.004960298538208008, -0.004783749580383301, -0.004607200622558594, -0.004430651664733887, -0.00425410270690918, -0.004077553749084473, -0.0039010047912597656, -0.0037244558334350586, -0.0035479068756103516, -0.0033713579177856445, -0.0031948089599609375, -0.0030182600021362305, -0.0028417110443115234, -0.0026651620864868164, -0.0024886131286621094, -0.0023120641708374023, -0.0021355152130126953, -0.0019589662551879883, -0.0017824172973632812, -0.0016058683395385742, -0.0014293193817138672, -0.0012527704238891602, -0.0010762214660644531, -0.0008996725082397461, -0.0007231235504150391, -0.000546574592590332, -0.000370025634765625, -0.00019347667694091797, -1.6927719116210938e-05, 0.0001596212387084961, 0.0003361701965332031, 0.0005127191543579102, 0.0006892681121826172, 0.0008658170700073242, 0.0010423660278320312, 0.0012189149856567383, 0.0013954639434814453, 0.0015720129013061523, 0.0017485618591308594, 0.0019251108169555664, 0.0021016597747802734, 0.0022782087326049805, 0.0024547576904296875, 0.0026313066482543945, 0.0028078556060791016, 0.0029844045639038086, 0.0031609535217285156, 0.0033375024795532227, 0.0035140514373779297, 0.0036906003952026367, 0.0038671493530273438, 0.004043698310852051, 0.004220247268676758, 0.004396796226501465, 0.004573345184326172, 0.004749894142150879, 0.004926443099975586, 0.005102992057800293, 0.005279541015625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 6.0, 5.0, 11.0, 14.0, 9.0, 8.0, 18.0, 24.0, 18.0, 29.0, 28.0, 37.0, 33.0, 36.0, 47.0, 34.0, 41.0, 38.0, 42.0, 54.0, 34.0, 42.0, 36.0, 39.0, 47.0, 45.0, 39.0, 30.0, 22.0, 21.0, 20.0, 18.0, 11.0, 7.0, 8.0, 8.0, 9.0, 6.0, 7.0, 7.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.002002716064453125, -0.0019292235374450684, -0.0018557310104370117, -0.001782238483428955, -0.0017087459564208984, -0.0016352534294128418, -0.0015617609024047852, -0.0014882683753967285, -0.0014147758483886719, -0.0013412833213806152, -0.0012677907943725586, -0.001194298267364502, -0.0011208057403564453, -0.0010473132133483887, -0.000973820686340332, -0.0009003281593322754, -0.0008268356323242188, -0.0007533431053161621, -0.0006798505783081055, -0.0006063580513000488, -0.0005328655242919922, -0.00045937299728393555, -0.0003858804702758789, -0.00031238794326782227, -0.00023889541625976562, -0.00016540288925170898, -9.191036224365234e-05, -1.8417835235595703e-05, 5.507469177246094e-05, 0.00012856721878051758, 0.00020205974578857422, 0.00027555227279663086, 0.0003490447998046875, 0.00042253732681274414, 0.0004960298538208008, 0.0005695223808288574, 0.0006430149078369141, 0.0007165074348449707, 0.0007899999618530273, 0.000863492488861084, 0.0009369850158691406, 0.0010104775428771973, 0.001083970069885254, 0.0011574625968933105, 0.0012309551239013672, 0.0013044476509094238, 0.0013779401779174805, 0.0014514327049255371, 0.0015249252319335938, 0.0015984177589416504, 0.001671910285949707, 0.0017454028129577637, 0.0018188953399658203, 0.001892387866973877, 0.0019658803939819336, 0.0020393729209899902, 0.002112865447998047, 0.0021863579750061035, 0.00225985050201416, 0.002333343029022217, 0.0024068355560302734, 0.00248032808303833, 0.0025538206100463867, 0.0026273131370544434, 0.0027008056640625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 4.0, 8.0, 7.0, 22.0, 28.0, 36.0, 56.0, 82.0, 133.0, 173.0, 271.0, 382.0, 512.0, 861.0, 1268.0, 2032.0, 3076.0, 4720.0, 7412.0, 12101.0, 20317.0, 34390.0, 60977.0, 110892.0, 200254.0, 244724.0, 149129.0, 81436.0, 45373.0, 26003.0, 15482.0, 9478.0, 5958.0, 3743.0, 2458.0, 1587.0, 1018.0, 696.0, 478.0, 304.0, 211.0, 146.0, 101.0, 62.0, 51.0, 33.0, 18.0, 22.0, 19.0, 4.0, 2.0, 4.0, 4.0, 0.0, 3.0], "bins": [-0.00550079345703125, -0.005340158939361572, -0.0051795244216918945, -0.005018889904022217, -0.004858255386352539, -0.004697620868682861, -0.004536986351013184, -0.004376351833343506, -0.004215717315673828, -0.00405508279800415, -0.0038944482803344727, -0.003733813762664795, -0.003573179244995117, -0.0034125447273254395, -0.0032519102096557617, -0.003091275691986084, -0.0029306411743164062, -0.0027700066566467285, -0.0026093721389770508, -0.002448737621307373, -0.0022881031036376953, -0.0021274685859680176, -0.00196683406829834, -0.0018061995506286621, -0.0016455650329589844, -0.0014849305152893066, -0.001324295997619629, -0.0011636614799499512, -0.0010030269622802734, -0.0008423924446105957, -0.000681757926940918, -0.0005211234092712402, -0.0003604888916015625, -0.00019985437393188477, -3.921985626220703e-05, 0.0001214146614074707, 0.00028204917907714844, 0.00044268369674682617, 0.0006033182144165039, 0.0007639527320861816, 0.0009245872497558594, 0.0010852217674255371, 0.0012458562850952148, 0.0014064908027648926, 0.0015671253204345703, 0.001727759838104248, 0.0018883943557739258, 0.0020490288734436035, 0.0022096633911132812, 0.002370297908782959, 0.0025309324264526367, 0.0026915669441223145, 0.002852201461791992, 0.00301283597946167, 0.0031734704971313477, 0.0033341050148010254, 0.003494739532470703, 0.003655374050140381, 0.0038160085678100586, 0.003976643085479736, 0.004137277603149414, 0.004297912120819092, 0.0044585466384887695, 0.004619181156158447, 0.004779815673828125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 8.0, 5.0, 10.0, 9.0, 13.0, 12.0, 20.0, 9.0, 29.0, 26.0, 28.0, 29.0, 23.0, 33.0, 30.0, 43.0, 28.0, 34.0, 34.0, 30.0, 39.0, 46.0, 38.0, 47.0, 43.0, 35.0, 39.0, 30.0, 31.0, 31.0, 26.0, 19.0, 25.0, 12.0, 6.0, 13.0, 10.0, 9.0, 7.0, 4.0, 9.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0012674331665039062, -0.0012239068746566772, -0.0011803805828094482, -0.0011368542909622192, -0.0010933279991149902, -0.0010498017072677612, -0.0010062754154205322, -0.0009627491235733032, -0.0009192228317260742, -0.0008756965398788452, -0.0008321702480316162, -0.0007886439561843872, -0.0007451176643371582, -0.0007015913724899292, -0.0006580650806427002, -0.0006145387887954712, -0.0005710124969482422, -0.0005274862051010132, -0.0004839599132537842, -0.0004404336214065552, -0.00039690732955932617, -0.00035338103771209717, -0.00030985474586486816, -0.00026632845401763916, -0.00022280216217041016, -0.00017927587032318115, -0.00013574957847595215, -9.222328662872314e-05, -4.869699478149414e-05, -5.170702934265137e-06, 3.835558891296387e-05, 8.188188076019287e-05, 0.00012540817260742188, 0.00016893446445465088, 0.00021246075630187988, 0.0002559870481491089, 0.0002995133399963379, 0.0003430396318435669, 0.0003865659236907959, 0.0004300922155380249, 0.0004736185073852539, 0.0005171447992324829, 0.0005606710910797119, 0.0006041973829269409, 0.0006477236747741699, 0.0006912499666213989, 0.0007347762584686279, 0.0007783025503158569, 0.0008218288421630859, 0.0008653551340103149, 0.0009088814258575439, 0.000952407717704773, 0.000995934009552002, 0.001039460301399231, 0.00108298659324646, 0.001126512885093689, 0.001170039176940918, 0.001213565468788147, 0.001257091760635376, 0.001300618052482605, 0.001344144344329834, 0.001387670636177063, 0.001431196928024292, 0.001474723219871521, 0.00151824951171875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 10.0, 9.0, 15.0, 16.0, 11.0, 25.0, 31.0, 56.0, 85.0, 111.0, 165.0, 273.0, 339.0, 627.0, 861.0, 1250.0, 1878.0, 2790.0, 4317.0, 7396.0, 20100.0, 306395.0, 650729.0, 28659.0, 8378.0, 4642.0, 3121.0, 2025.0, 1417.0, 965.0, 629.0, 414.0, 245.0, 184.0, 89.0, 91.0, 42.0, 51.0, 28.0, 16.0, 11.0, 13.0, 8.0, 6.0, 6.0, 10.0, 9.0, 2.0, 0.0, 2.0], "bins": [-0.0013532638549804688, -0.001315772533416748, -0.0012782812118530273, -0.0012407898902893066, -0.001203298568725586, -0.0011658072471618652, -0.0011283159255981445, -0.0010908246040344238, -0.0010533332824707031, -0.0010158419609069824, -0.0009783506393432617, -0.000940859317779541, -0.0009033679962158203, -0.0008658766746520996, -0.0008283853530883789, -0.0007908940315246582, -0.0007534027099609375, -0.0007159113883972168, -0.0006784200668334961, -0.0006409287452697754, -0.0006034374237060547, -0.000565946102142334, -0.0005284547805786133, -0.0004909634590148926, -0.0004534721374511719, -0.00041598081588745117, -0.00037848949432373047, -0.00034099817276000977, -0.00030350685119628906, -0.00026601552963256836, -0.00022852420806884766, -0.00019103288650512695, -0.00015354156494140625, -0.00011605024337768555, -7.855892181396484e-05, -4.106760025024414e-05, -3.5762786865234375e-06, 3.3915042877197266e-05, 7.140636444091797e-05, 0.00010889768600463867, 0.00014638900756835938, 0.00018388032913208008, 0.00022137165069580078, 0.0002588629722595215, 0.0002963542938232422, 0.0003338456153869629, 0.0003713369369506836, 0.0004088282585144043, 0.000446319580078125, 0.0004838109016418457, 0.0005213022232055664, 0.0005587935447692871, 0.0005962848663330078, 0.0006337761878967285, 0.0006712675094604492, 0.0007087588310241699, 0.0007462501525878906, 0.0007837414741516113, 0.000821232795715332, 0.0008587241172790527, 0.0008962154388427734, 0.0009337067604064941, 0.0009711980819702148, 0.0010086894035339355, 0.0010461807250976562]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 9.0, 0.0, 0.0, 19.0, 0.0, 0.0, 33.0, 0.0, 0.0, 72.0, 0.0, 106.0, 0.0, 0.0, 157.0, 0.0, 0.0, 203.0, 0.0, 0.0, 183.0, 0.0, 100.0, 0.0, 0.0, 63.0, 0.0, 0.0, 26.0, 0.0, 0.0, 23.0, 0.0, 0.0, 11.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.938353180885315e-07, -6.724148988723755e-07, -6.509944796562195e-07, -6.295740604400635e-07, -6.081536412239075e-07, -5.867332220077515e-07, -5.653128027915955e-07, -5.438923835754395e-07, -5.224719643592834e-07, -5.010515451431274e-07, -4.796311259269714e-07, -4.5821070671081543e-07, -4.367902874946594e-07, -4.153698682785034e-07, -3.939494490623474e-07, -3.725290298461914e-07, -3.511086106300354e-07, -3.296881914138794e-07, -3.082677721977234e-07, -2.868473529815674e-07, -2.654269337654114e-07, -2.4400651454925537e-07, -2.2258609533309937e-07, -2.0116567611694336e-07, -1.7974525690078735e-07, -1.5832483768463135e-07, -1.3690441846847534e-07, -1.1548399925231934e-07, -9.406358003616333e-08, -7.264316082000732e-08, -5.122274160385132e-08, -2.9802322387695312e-08, -8.381903171539307e-09, 1.30385160446167e-08, 3.4458935260772705e-08, 5.587935447692871e-08, 7.729977369308472e-08, 9.872019290924072e-08, 1.2014061212539673e-07, 1.4156103134155273e-07, 1.6298145055770874e-07, 1.8440186977386475e-07, 2.0582228899002075e-07, 2.2724270820617676e-07, 2.4866312742233276e-07, 2.7008354663848877e-07, 2.915039658546448e-07, 3.129243850708008e-07, 3.343448042869568e-07, 3.557652235031128e-07, 3.771856427192688e-07, 3.986060619354248e-07, 4.200264811515808e-07, 4.414469003677368e-07, 4.628673195838928e-07, 4.842877388000488e-07, 5.057081580162048e-07, 5.271285772323608e-07, 5.485489964485168e-07, 5.699694156646729e-07, 5.913898348808289e-07, 6.128102540969849e-07, 6.342306733131409e-07, 6.556510925292969e-07]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 11.0, 14.0, 21.0, 27.0, 31.0, 53.0, 69.0, 71.0, 130.0, 170.0, 205.0, 290.0, 407.0, 486.0, 655.0, 881.0, 1214.0, 1896.0, 3107.0, 6119.0, 20806.0, 957728.0, 36597.0, 7012.0, 3455.0, 2058.0, 1239.0, 967.0, 664.0, 520.0, 414.0, 308.0, 219.0, 182.0, 139.0, 100.0, 79.0, 55.0, 40.0, 28.0, 24.0, 17.0, 14.0, 3.0, 3.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.002742767333984375, -0.0026559531688690186, -0.002569139003753662, -0.0024823248386383057, -0.0023955106735229492, -0.0023086965084075928, -0.0022218823432922363, -0.00213506817817688, -0.0020482540130615234, -0.001961439847946167, -0.0018746256828308105, -0.001787811517715454, -0.0017009973526000977, -0.0016141831874847412, -0.0015273690223693848, -0.0014405548572540283, -0.0013537406921386719, -0.0012669265270233154, -0.001180112361907959, -0.0010932981967926025, -0.001006484031677246, -0.0009196698665618896, -0.0008328557014465332, -0.0007460415363311768, -0.0006592273712158203, -0.0005724132061004639, -0.0004855990409851074, -0.000398784875869751, -0.00031197071075439453, -0.00022515654563903809, -0.00013834238052368164, -5.1528215408325195e-05, 3.528594970703125e-05, 0.0001221001148223877, 0.00020891427993774414, 0.0002957284450531006, 0.00038254261016845703, 0.0004693567752838135, 0.0005561709403991699, 0.0006429851055145264, 0.0007297992706298828, 0.0008166134357452393, 0.0009034276008605957, 0.0009902417659759521, 0.0010770559310913086, 0.001163870096206665, 0.0012506842613220215, 0.001337498426437378, 0.0014243125915527344, 0.0015111267566680908, 0.0015979409217834473, 0.0016847550868988037, 0.0017715692520141602, 0.0018583834171295166, 0.001945197582244873, 0.0020320117473602295, 0.002118825912475586, 0.0022056400775909424, 0.002292454242706299, 0.0023792684078216553, 0.0024660825729370117, 0.002552896738052368, 0.0026397109031677246, 0.002726525068283081, 0.0028133392333984375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 34.0, 192.0, 510.0, 176.0, 30.0, 9.0, 3.0, 6.0, 5.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006208419799804688, -0.0005990341305732727, -0.0005772262811660767, -0.0005554184317588806, -0.0005336105823516846, -0.0005118027329444885, -0.0004899948835372925, -0.00046818703413009644, -0.0004463791847229004, -0.00042457133531570435, -0.0004027634859085083, -0.00038095563650131226, -0.0003591477870941162, -0.00033733993768692017, -0.0003155320882797241, -0.0002937242388725281, -0.00027191638946533203, -0.000250108540058136, -0.00022830069065093994, -0.0002064928412437439, -0.00018468499183654785, -0.0001628771424293518, -0.00014106929302215576, -0.00011926144361495972, -9.745359420776367e-05, -7.564574480056763e-05, -5.383789539337158e-05, -3.203004598617554e-05, -1.0222196578979492e-05, 1.1585652828216553e-05, 3.33935022354126e-05, 5.520135164260864e-05, 7.700920104980469e-05, 9.881705045700073e-05, 0.00012062489986419678, 0.00014243274927139282, 0.00016424059867858887, 0.0001860484480857849, 0.00020785629749298096, 0.000229664146900177, 0.00025147199630737305, 0.0002732798457145691, 0.00029508769512176514, 0.0003168955445289612, 0.0003387033939361572, 0.00036051124334335327, 0.0003823190927505493, 0.00040412694215774536, 0.0004259347915649414, 0.00044774264097213745, 0.0004695504903793335, 0.0004913583397865295, 0.0005131661891937256, 0.0005349740386009216, 0.0005567818880081177, 0.0005785897374153137, 0.0006003975868225098, 0.0006222054362297058, 0.0006440132856369019, 0.0006658211350440979, 0.0006876289844512939, 0.00070943683385849, 0.000731244683265686, 0.0007530525326728821, 0.0007748603820800781]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 3.0, 6.0, 15.0, 16.0, 11.0, 20.0, 18.0, 36.0, 47.0, 66.0, 79.0, 89.0, 96.0, 104.0, 75.0, 61.0, 65.0, 34.0, 31.0, 28.0, 18.0, 20.0, 13.0, 9.0, 5.0, 5.0, 4.0, 3.0, 6.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003143907990306616, -0.0030275105964392424, -0.002911113202571869, -0.0027947158087044954, -0.002678318414837122, -0.0025619210209697485, -0.002445523627102375, -0.0023291262332350016, -0.002212728839367628, -0.0020963314455002546, -0.001979934051632881, -0.0018635366577655077, -0.0017471392638981342, -0.0016307418700307608, -0.0015143444761633873, -0.0013979470822960138, -0.0012815495720133185, -0.001165152178145945, -0.0010487547842785716, -0.0009323573904111981, -0.0008159599965438247, -0.0006995625444687903, -0.0005831651506014168, -0.00046676775673404336, -0.0003503703628666699, -0.00023397296899929643, -0.00011757556058000773, -1.178152160719037e-06, 0.00011521924170665443, 0.00023161666467785835, 0.0003480140585452318, 0.0004644114524126053, 0.0005808088462799788, 0.0006972062401473522, 0.0008136036340147257, 0.0009300010278820992, 0.0010463984217494726, 0.001162795815616846, 0.0012791932094842196, 0.001395590603351593, 0.0015119879972189665, 0.00162838539108634, 0.0017447827849537134, 0.0018611801788210869, 0.0019775775726884604, 0.002093974966555834, 0.0022103723604232073, 0.0023267697542905807, 0.002443167380988598, 0.0025595647748559713, 0.002675962168723345, 0.0027923595625907183, 0.0029087569564580917, 0.003025154350325465, 0.0031415517441928387, 0.003257949138060212, 0.0033743465319275856, 0.003490743925794959, 0.0036071413196623325, 0.003723538713529706, 0.0038399361073970795, 0.003956333734095097, 0.004072730895131826, 0.0041891285218298435, 0.004305525682866573]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 1.0, 6.0, 9.0, 4.0, 12.0, 14.0, 12.0, 16.0, 20.0, 17.0, 20.0, 40.0, 21.0, 36.0, 32.0, 45.0, 37.0, 49.0, 42.0, 40.0, 38.0, 39.0, 43.0, 47.0, 40.0, 38.0, 42.0, 31.0, 29.0, 28.0, 21.0, 21.0, 18.0, 16.0, 16.0, 17.0, 13.0, 8.0, 9.0, 4.0, 6.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002348981099203229, -0.002270263386890292, -0.0021915454417467117, -0.002112827729433775, -0.0020341097842901945, -0.0019553920719772577, -0.0018766741268336773, -0.0017979564145207405, -0.00171923846937716, -0.0016405206406489015, -0.0015618028119206429, -0.0014830849831923842, -0.0014043671544641256, -0.001325649325735867, -0.0012469314970076084, -0.0011682137846946716, -0.001089495955966413, -0.0010107781272381544, -0.0009320602985098958, -0.0008533424697816372, -0.0007746246410533786, -0.00069590681232512, -0.0006171890418045223, -0.0005384712130762637, -0.00045975338434800506, -0.00038103555561974645, -0.00030231772689148784, -0.00022359992726705968, -0.00014488209853880107, -6.616426981054246e-05, 1.2553529813885689e-05, 9.12713585421443e-05, 0.0001699891872704029, 0.0002487070159986615, 0.00032742484472692013, 0.0004061426443513483, 0.0004848604730796069, 0.000563578330911696, 0.0006422961014322937, 0.0007210139301605523, 0.0007997317588888109, 0.0008784495876170695, 0.0009571674163453281, 0.0010358851868659258, 0.0011146030155941844, 0.001193320844322443, 0.0012720386730507016, 0.0013507565017789602, 0.0014294743305072188, 0.0015081921592354774, 0.001586909987963736, 0.0016656278166919947, 0.0017443456454202533, 0.0018230634741485119, 0.0019017811864614487, 0.001980499131605029, 0.002059216843917966, 0.0021379345562309027, 0.002216652501374483, 0.00229537021368742, 0.0023740881588310003, 0.002452805871143937, 0.0025315238162875175, 0.0026102415286004543, 0.0026889594737440348]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 13.0, 18.0, 13.0, 18.0, 35.0, 41.0, 84.0, 98.0, 142.0, 183.0, 267.0, 366.0, 514.0, 782.0, 1139.0, 1640.0, 2397.0, 3643.0, 5756.0, 9141.0, 15270.0, 26285.0, 50005.0, 105232.0, 279635.0, 1010918.0, 1779008.0, 561718.0, 171850.0, 73566.0, 37602.0, 21022.0, 12311.0, 7886.0, 4926.0, 3342.0, 2276.0, 1565.0, 1025.0, 747.0, 524.0, 367.0, 273.0, 200.0, 115.0, 96.0, 57.0, 61.0, 35.0, 24.0, 17.0, 15.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0], "bins": [-0.004299163818359375, -0.004166007041931152, -0.00403285026550293, -0.003899693489074707, -0.0037665367126464844, -0.0036333799362182617, -0.003500223159790039, -0.0033670663833618164, -0.0032339096069335938, -0.003100752830505371, -0.0029675960540771484, -0.0028344392776489258, -0.002701282501220703, -0.0025681257247924805, -0.002434968948364258, -0.002301812171936035, -0.0021686553955078125, -0.00203549861907959, -0.0019023418426513672, -0.0017691850662231445, -0.0016360282897949219, -0.0015028715133666992, -0.0013697147369384766, -0.001236557960510254, -0.0011034011840820312, -0.0009702444076538086, -0.0008370876312255859, -0.0007039308547973633, -0.0005707740783691406, -0.00043761730194091797, -0.0003044605255126953, -0.00017130374908447266, -3.814697265625e-05, 9.500980377197266e-05, 0.0002281665802001953, 0.00036132335662841797, 0.0004944801330566406, 0.0006276369094848633, 0.0007607936859130859, 0.0008939504623413086, 0.0010271072387695312, 0.001160264015197754, 0.0012934207916259766, 0.0014265775680541992, 0.0015597343444824219, 0.0016928911209106445, 0.0018260478973388672, 0.00195920467376709, 0.0020923614501953125, 0.002225518226623535, 0.002358675003051758, 0.0024918317794799805, 0.002624988555908203, 0.0027581453323364258, 0.0028913021087646484, 0.003024458885192871, 0.0031576156616210938, 0.0032907724380493164, 0.003423929214477539, 0.0035570859909057617, 0.0036902427673339844, 0.003823399543762207, 0.00395655632019043, 0.004089713096618652, 0.004222869873046875]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 6.0, 21.0, 9.0, 13.0, 20.0, 22.0, 33.0, 20.0, 32.0, 32.0, 29.0, 43.0, 48.0, 57.0, 38.0, 45.0, 43.0, 36.0, 47.0, 55.0, 41.0, 33.0, 31.0, 37.0, 24.0, 30.0, 16.0, 20.0, 19.0, 16.0, 5.0, 16.0, 14.0, 4.0, 6.0, 5.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018520355224609375, -0.0017892122268676758, -0.001726388931274414, -0.0016635656356811523, -0.0016007423400878906, -0.001537919044494629, -0.0014750957489013672, -0.0014122724533081055, -0.0013494491577148438, -0.001286625862121582, -0.0012238025665283203, -0.0011609792709350586, -0.0010981559753417969, -0.0010353326797485352, -0.0009725093841552734, -0.0009096860885620117, -0.00084686279296875, -0.0007840394973754883, -0.0007212162017822266, -0.0006583929061889648, -0.0005955696105957031, -0.0005327463150024414, -0.0004699230194091797, -0.00040709972381591797, -0.00034427642822265625, -0.00028145313262939453, -0.0002186298370361328, -0.0001558065414428711, -9.298324584960938e-05, -3.0159950256347656e-05, 3.266334533691406e-05, 9.548664093017578e-05, 0.0001583099365234375, 0.00022113323211669922, 0.00028395652770996094, 0.00034677982330322266, 0.0004096031188964844, 0.0004724264144897461, 0.0005352497100830078, 0.0005980730056762695, 0.0006608963012695312, 0.000723719596862793, 0.0007865428924560547, 0.0008493661880493164, 0.0009121894836425781, 0.0009750127792358398, 0.0010378360748291016, 0.0011006593704223633, 0.001163482666015625, 0.0012263059616088867, 0.0012891292572021484, 0.0013519525527954102, 0.0014147758483886719, 0.0014775991439819336, 0.0015404224395751953, 0.001603245735168457, 0.0016660690307617188, 0.0017288923263549805, 0.0017917156219482422, 0.001854538917541504, 0.0019173622131347656, 0.0019801855087280273, 0.002043008804321289, 0.0021058320999145508, 0.0021686553955078125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 6.0, 7.0, 10.0, 14.0, 25.0, 44.0, 42.0, 78.0, 94.0, 155.0, 182.0, 276.0, 406.0, 581.0, 867.0, 1216.0, 1730.0, 2620.0, 4012.0, 6278.0, 10109.0, 16459.0, 27944.0, 48666.0, 91149.0, 184500.0, 424497.0, 1217515.0, 1293230.0, 448317.0, 192914.0, 94522.0, 50810.0, 28726.0, 16625.0, 10209.0, 6533.0, 4247.0, 2779.0, 1856.0, 1227.0, 880.0, 575.0, 394.0, 267.0, 191.0, 154.0, 105.0, 72.0, 53.0, 47.0, 26.0, 17.0, 14.0, 17.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.003566741943359375, -0.003451794385910034, -0.0033368468284606934, -0.0032218992710113525, -0.0031069517135620117, -0.002992004156112671, -0.00287705659866333, -0.0027621090412139893, -0.0026471614837646484, -0.0025322139263153076, -0.002417266368865967, -0.002302318811416626, -0.002187371253967285, -0.0020724236965179443, -0.0019574761390686035, -0.0018425285816192627, -0.0017275810241699219, -0.001612633466720581, -0.0014976859092712402, -0.0013827383518218994, -0.0012677907943725586, -0.0011528432369232178, -0.001037895679473877, -0.0009229481220245361, -0.0008080005645751953, -0.0006930530071258545, -0.0005781054496765137, -0.00046315789222717285, -0.00034821033477783203, -0.0002332627773284912, -0.00011831521987915039, -3.3676624298095703e-06, 0.00011157989501953125, 0.00022652745246887207, 0.0003414750099182129, 0.0004564225673675537, 0.0005713701248168945, 0.0006863176822662354, 0.0008012652397155762, 0.000916212797164917, 0.0010311603546142578, 0.0011461079120635986, 0.0012610554695129395, 0.0013760030269622803, 0.001490950584411621, 0.001605898141860962, 0.0017208456993103027, 0.0018357932567596436, 0.0019507408142089844, 0.002065688371658325, 0.002180635929107666, 0.002295583486557007, 0.0024105310440063477, 0.0025254786014556885, 0.0026404261589050293, 0.00275537371635437, 0.002870321273803711, 0.0029852688312530518, 0.0031002163887023926, 0.0032151639461517334, 0.0033301115036010742, 0.003445059061050415, 0.003560006618499756, 0.0036749541759490967, 0.0037899017333984375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 10.0, 6.0, 10.0, 8.0, 15.0, 19.0, 17.0, 27.0, 24.0, 35.0, 61.0, 52.0, 88.0, 79.0, 121.0, 127.0, 173.0, 204.0, 250.0, 305.0, 377.0, 358.0, 298.0, 234.0, 211.0, 184.0, 132.0, 103.0, 105.0, 90.0, 51.0, 54.0, 49.0, 42.0, 25.0, 28.0, 24.0, 21.0, 9.0, 9.0, 6.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011205673217773438, -0.001086696982383728, -0.0010528266429901123, -0.0010189563035964966, -0.0009850859642028809, -0.0009512156248092651, -0.0009173452854156494, -0.0008834749460220337, -0.000849604606628418, -0.0008157342672348022, -0.0007818639278411865, -0.0007479935884475708, -0.0007141232490539551, -0.0006802529096603394, -0.0006463825702667236, -0.0006125122308731079, -0.0005786418914794922, -0.0005447715520858765, -0.0005109012126922607, -0.000477030873298645, -0.0004431605339050293, -0.0004092901945114136, -0.00037541985511779785, -0.00034154951572418213, -0.0003076791763305664, -0.0002738088369369507, -0.00023993849754333496, -0.00020606815814971924, -0.00017219781875610352, -0.0001383274793624878, -0.00010445713996887207, -7.058680057525635e-05, -3.6716461181640625e-05, -2.8461217880249023e-06, 3.102421760559082e-05, 6.489455699920654e-05, 9.876489639282227e-05, 0.000132635235786438, 0.0001665055751800537, 0.00020037591457366943, 0.00023424625396728516, 0.0002681165933609009, 0.0003019869327545166, 0.0003358572721481323, 0.00036972761154174805, 0.00040359795093536377, 0.0004374682903289795, 0.0004713386297225952, 0.0005052089691162109, 0.0005390793085098267, 0.0005729496479034424, 0.0006068199872970581, 0.0006406903266906738, 0.0006745606660842896, 0.0007084310054779053, 0.000742301344871521, 0.0007761716842651367, 0.0008100420236587524, 0.0008439123630523682, 0.0008777827024459839, 0.0009116530418395996, 0.0009455233812332153, 0.000979393720626831, 0.0010132640600204468, 0.0010471343994140625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 1.0, 7.0, 14.0, 12.0, 26.0, 16.0, 21.0, 19.0, 35.0, 27.0, 43.0, 66.0, 63.0, 79.0, 69.0, 63.0, 71.0, 82.0, 50.0, 41.0, 37.0, 19.0, 17.0, 20.0, 18.0, 14.0, 12.0, 5.0, 6.0, 7.0, 4.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028761287685483694, -0.0027792067267000675, -0.002682284452021122, -0.00258536241017282, -0.002488440368324518, -0.0023915180936455727, -0.0022945960517972708, -0.002197674009948969, -0.0021007517352700233, -0.0020038296934217215, -0.001906907418742776, -0.001809985376894474, -0.0017130632186308503, -0.0016161410603672266, -0.0015192190185189247, -0.001422296860255301, -0.0013253747019916773, -0.0012284525437280536, -0.0011315303854644299, -0.001034608343616128, -0.0009376861853525043, -0.0008407640270888805, -0.0007438419270329177, -0.0006469198269769549, -0.0005499976687133312, -0.00045307553955353796, -0.0003561534103937447, -0.00025923128123395145, -0.0001623091520741582, -6.538702291436493e-05, 3.1535106245428324e-05, 0.00012845720630139112, 0.00022537913173437119, 0.00032230126089416444, 0.0004192233900539577, 0.0005161454901099205, 0.0006130676483735442, 0.0007099898066371679, 0.0008069119066931307, 0.0009038340067490935, 0.0010007561650127172, 0.001097678323276341, 0.0011946004815399647, 0.0012915225233882666, 0.0013884446816518903, 0.001485366839915514, 0.0015822888817638159, 0.0016792110400274396, 0.0017761331982910633, 0.001873055356554687, 0.0019699775148183107, 0.0020668995566666126, 0.002163821831345558, 0.00226074387319386, 0.002357665915042162, 0.0024545881897211075, 0.0025515102315694094, 0.0026484322734177113, 0.002745354548096657, 0.0028422765899449587, 0.0029391986317932606, 0.003036120906472206, 0.003133042948320508, 0.00322996499016881, 0.0033268872648477554]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 7.0, 8.0, 14.0, 18.0, 11.0, 10.0, 20.0, 31.0, 20.0, 26.0, 26.0, 31.0, 37.0, 41.0, 32.0, 34.0, 48.0, 32.0, 43.0, 34.0, 45.0, 40.0, 47.0, 38.0, 37.0, 35.0, 31.0, 21.0, 23.0, 21.0, 20.0, 11.0, 19.0, 10.0, 14.0, 11.0, 7.0, 7.0, 9.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0019662862177938223, -0.0019031199626624584, -0.0018399538239464164, -0.0017767875688150525, -0.0017136214300990105, -0.0016504551749676466, -0.0015872889198362827, -0.0015241226647049189, -0.0014609565259888768, -0.001397790270857513, -0.001334624132141471, -0.001271457877010107, -0.0012082916218787432, -0.0011451254831627011, -0.0010819592280313373, -0.0010187930893152952, -0.0009556268341839314, -0.0008924606372602284, -0.0008292944403365254, -0.0007661281852051616, -0.0007029619882814586, -0.0006397957913577557, -0.0005766295362263918, -0.0005134633393026888, -0.0004502971423789859, -0.0003871309454552829, -0.0003239647194277495, -0.0002607984934002161, -0.00019763229647651315, -0.0001344660995528102, -7.129987352527678e-05, -8.133647497743368e-06, 5.503278225660324e-05, 0.00011819899373222142, 0.0001813652052078396, 0.000244531431235373, 0.000307697628159076, 0.00037086382508277893, 0.00043403005111031234, 0.0004971962771378458, 0.0005603624740615487, 0.0006235286709852517, 0.0006866948679089546, 0.0007498611230403185, 0.0008130273199640214, 0.0008761935168877244, 0.0009393597720190883, 0.0010025259107351303, 0.0010656921658664942, 0.001128858420997858, 0.0011920245597139, 0.001255190814845264, 0.001318356953561306, 0.0013815232086926699, 0.0014446894638240337, 0.0015078557189553976, 0.0015710218576714396, 0.0016341881128028035, 0.0016973542515188456, 0.0017605205066502094, 0.0018236867617815733, 0.0018868529004976153, 0.0019500191556289792, 0.0020131852943450212, 0.002076351549476385]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 6.0, 10.0, 15.0, 19.0, 29.0, 27.0, 53.0, 77.0, 126.0, 165.0, 248.0, 403.0, 570.0, 970.0, 1295.0, 2086.0, 3167.0, 4922.0, 8033.0, 13012.0, 22004.0, 38859.0, 75091.0, 162110.0, 333294.0, 190741.0, 84737.0, 43815.0, 24121.0, 14453.0, 8727.0, 5308.0, 3502.0, 2230.0, 1487.0, 974.0, 584.0, 394.0, 287.0, 218.0, 129.0, 88.0, 62.0, 36.0, 25.0, 16.0, 13.0, 10.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00139617919921875, -0.001353338360786438, -0.001310497522354126, -0.001267656683921814, -0.001224815845489502, -0.00118197500705719, -0.001139134168624878, -0.001096293330192566, -0.001053452491760254, -0.001010611653327942, -0.0009677708148956299, -0.0009249299764633179, -0.0008820891380310059, -0.0008392482995986938, -0.0007964074611663818, -0.0007535666227340698, -0.0007107257843017578, -0.0006678849458694458, -0.0006250441074371338, -0.0005822032690048218, -0.0005393624305725098, -0.0004965215921401978, -0.00045368075370788574, -0.00041083991527557373, -0.0003679990768432617, -0.0003251582384109497, -0.0002823173999786377, -0.00023947656154632568, -0.00019663572311401367, -0.00015379488468170166, -0.00011095404624938965, -6.811320781707764e-05, -2.5272369384765625e-05, 1.7568469047546387e-05, 6.04093074798584e-05, 0.00010325014591217041, 0.00014609098434448242, 0.00018893182277679443, 0.00023177266120910645, 0.00027461349964141846, 0.00031745433807373047, 0.0003602951765060425, 0.0004031360149383545, 0.0004459768533706665, 0.0004888176918029785, 0.0005316585302352905, 0.0005744993686676025, 0.0006173402070999146, 0.0006601810455322266, 0.0007030218839645386, 0.0007458627223968506, 0.0007887035608291626, 0.0008315443992614746, 0.0008743852376937866, 0.0009172260761260986, 0.0009600669145584106, 0.0010029077529907227, 0.0010457485914230347, 0.0010885894298553467, 0.0011314302682876587, 0.0011742711067199707, 0.0012171119451522827, 0.0012599527835845947, 0.0013027936220169067, 0.0013456344604492188]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 9.0, 6.0, 11.0, 11.0, 13.0, 14.0, 8.0, 19.0, 25.0, 23.0, 27.0, 31.0, 26.0, 40.0, 38.0, 42.0, 47.0, 38.0, 41.0, 43.0, 38.0, 41.0, 40.0, 48.0, 46.0, 35.0, 38.0, 30.0, 15.0, 24.0, 14.0, 14.0, 12.0, 21.0, 8.0, 6.0, 10.0, 10.0, 9.0, 8.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0021457672119140625, -0.002077460289001465, -0.002009153366088867, -0.0019408464431762695, -0.0018725395202636719, -0.0018042325973510742, -0.0017359256744384766, -0.001667618751525879, -0.0015993118286132812, -0.0015310049057006836, -0.001462697982788086, -0.0013943910598754883, -0.0013260841369628906, -0.001257777214050293, -0.0011894702911376953, -0.0011211633682250977, -0.0010528564453125, -0.0009845495223999023, -0.0009162425994873047, -0.000847935676574707, -0.0007796287536621094, -0.0007113218307495117, -0.0006430149078369141, -0.0005747079849243164, -0.0005064010620117188, -0.0004380941390991211, -0.00036978721618652344, -0.0003014802932739258, -0.00023317337036132812, -0.00016486644744873047, -9.655952453613281e-05, -2.8252601623535156e-05, 4.00543212890625e-05, 0.00010836124420166016, 0.0001766681671142578, 0.00024497509002685547, 0.0003132820129394531, 0.0003815889358520508, 0.00044989585876464844, 0.0005182027816772461, 0.0005865097045898438, 0.0006548166275024414, 0.0007231235504150391, 0.0007914304733276367, 0.0008597373962402344, 0.000928044319152832, 0.0009963512420654297, 0.0010646581649780273, 0.001132965087890625, 0.0012012720108032227, 0.0012695789337158203, 0.001337885856628418, 0.0014061927795410156, 0.0014744997024536133, 0.001542806625366211, 0.0016111135482788086, 0.0016794204711914062, 0.001747727394104004, 0.0018160343170166016, 0.0018843412399291992, 0.0019526481628417969, 0.0020209550857543945, 0.002089262008666992, 0.00215756893157959, 0.0022258758544921875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 11.0, 20.0, 15.0, 18.0, 32.0, 45.0, 96.0, 155.0, 266.0, 377.0, 647.0, 1137.0, 1830.0, 3178.0, 5818.0, 10603.0, 22498.0, 54885.0, 193711.0, 531627.0, 137594.0, 43756.0, 18790.0, 9290.0, 4939.0, 2866.0, 1586.0, 1088.0, 627.0, 372.0, 233.0, 146.0, 76.0, 75.0, 49.0, 27.0, 13.0, 13.0, 11.0, 11.0, 7.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0017061233520507812, -0.0016438215970993042, -0.0015815198421478271, -0.00151921808719635, -0.001456916332244873, -0.001394614577293396, -0.001332312822341919, -0.001270011067390442, -0.0012077093124389648, -0.0011454075574874878, -0.0010831058025360107, -0.0010208040475845337, -0.0009585022926330566, -0.0008962005376815796, -0.0008338987827301025, -0.0007715970277786255, -0.0007092952728271484, -0.0006469935178756714, -0.0005846917629241943, -0.0005223900079727173, -0.00046008825302124023, -0.0003977864980697632, -0.00033548474311828613, -0.0002731829881668091, -0.00021088123321533203, -0.00014857947826385498, -8.627772331237793e-05, -2.397596836090088e-05, 3.832578659057617e-05, 0.00010062754154205322, 0.00016292929649353027, 0.00022523105144500732, 0.0002875328063964844, 0.0003498345613479614, 0.0004121363162994385, 0.00047443807125091553, 0.0005367398262023926, 0.0005990415811538696, 0.0006613433361053467, 0.0007236450910568237, 0.0007859468460083008, 0.0008482486009597778, 0.0009105503559112549, 0.0009728521108627319, 0.001035153865814209, 0.001097455620765686, 0.001159757375717163, 0.0012220591306686401, 0.0012843608856201172, 0.0013466626405715942, 0.0014089643955230713, 0.0014712661504745483, 0.0015335679054260254, 0.0015958696603775024, 0.0016581714153289795, 0.0017204731702804565, 0.0017827749252319336, 0.0018450766801834106, 0.0019073784351348877, 0.0019696801900863647, 0.002031981945037842, 0.002094283699989319, 0.002156585454940796, 0.002218887209892273, 0.00228118896484375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 8.0, 8.0, 5.0, 15.0, 10.0, 16.0, 13.0, 24.0, 31.0, 28.0, 17.0, 31.0, 27.0, 46.0, 33.0, 36.0, 34.0, 32.0, 32.0, 38.0, 38.0, 46.0, 33.0, 36.0, 29.0, 42.0, 26.0, 37.0, 26.0, 24.0, 25.0, 12.0, 19.0, 10.0, 7.0, 22.0, 11.0, 14.0, 8.0, 7.0, 11.0, 4.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0012388229370117188, -0.001199290156364441, -0.001159757375717163, -0.0011202245950698853, -0.0010806918144226074, -0.0010411590337753296, -0.0010016262531280518, -0.0009620934724807739, -0.0009225606918334961, -0.0008830279111862183, -0.0008434951305389404, -0.0008039623498916626, -0.0007644295692443848, -0.0007248967885971069, -0.0006853640079498291, -0.0006458312273025513, -0.0006062984466552734, -0.0005667656660079956, -0.0005272328853607178, -0.00048770010471343994, -0.0004481673240661621, -0.0004086345434188843, -0.00036910176277160645, -0.0003295689821243286, -0.0002900362014770508, -0.00025050342082977295, -0.00021097064018249512, -0.00017143785953521729, -0.00013190507888793945, -9.237229824066162e-05, -5.283951759338379e-05, -1.3306736946105957e-05, 2.6226043701171875e-05, 6.575882434844971e-05, 0.00010529160499572754, 0.00014482438564300537, 0.0001843571662902832, 0.00022388994693756104, 0.00026342272758483887, 0.0003029555082321167, 0.00034248828887939453, 0.00038202106952667236, 0.0004215538501739502, 0.00046108663082122803, 0.0005006194114685059, 0.0005401521921157837, 0.0005796849727630615, 0.0006192177534103394, 0.0006587505340576172, 0.000698283314704895, 0.0007378160953521729, 0.0007773488759994507, 0.0008168816566467285, 0.0008564144372940063, 0.0008959472179412842, 0.000935479998588562, 0.0009750127792358398, 0.0010145455598831177, 0.0010540783405303955, 0.0010936111211776733, 0.0011331439018249512, 0.001172676682472229, 0.0012122094631195068, 0.0012517422437667847, 0.0012912750244140625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 7.0, 11.0, 14.0, 16.0, 24.0, 36.0, 46.0, 47.0, 78.0, 79.0, 101.0, 123.0, 187.0, 244.0, 397.0, 595.0, 912.0, 1714.0, 3854.0, 14039.0, 123109.0, 851077.0, 38281.0, 7244.0, 2609.0, 1253.0, 733.0, 501.0, 316.0, 195.0, 156.0, 102.0, 100.0, 55.0, 62.0, 41.0, 43.0, 32.0, 26.0, 19.0, 19.0, 16.0, 6.0, 10.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.0004172325134277344, -0.00040505826473236084, -0.0003928840160369873, -0.00038070976734161377, -0.00036853551864624023, -0.0003563612699508667, -0.00034418702125549316, -0.00033201277256011963, -0.0003198385238647461, -0.00030766427516937256, -0.000295490026473999, -0.0002833157777786255, -0.00027114152908325195, -0.0002589672803878784, -0.0002467930316925049, -0.00023461878299713135, -0.0002224445343017578, -0.00021027028560638428, -0.00019809603691101074, -0.0001859217882156372, -0.00017374753952026367, -0.00016157329082489014, -0.0001493990421295166, -0.00013722479343414307, -0.00012505054473876953, -0.000112876296043396, -0.00010070204734802246, -8.852779865264893e-05, -7.635354995727539e-05, -6.417930126190186e-05, -5.200505256652832e-05, -3.9830803871154785e-05, -2.765655517578125e-05, -1.5482306480407715e-05, -3.3080577850341797e-06, 8.866190910339355e-06, 2.104043960571289e-05, 3.3214688301086426e-05, 4.538893699645996e-05, 5.7563185691833496e-05, 6.973743438720703e-05, 8.191168308258057e-05, 9.40859317779541e-05, 0.00010626018047332764, 0.00011843442916870117, 0.0001306086778640747, 0.00014278292655944824, 0.00015495717525482178, 0.0001671314239501953, 0.00017930567264556885, 0.00019147992134094238, 0.00020365417003631592, 0.00021582841873168945, 0.000228002667427063, 0.00024017691612243652, 0.00025235116481781006, 0.0002645254135131836, 0.00027669966220855713, 0.00028887391090393066, 0.0003010481595993042, 0.00031322240829467773, 0.00032539665699005127, 0.0003375709056854248, 0.00034974515438079834, 0.0003619194030761719]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 9.0, 8.0, 19.0, 16.0, 0.0, 24.0, 17.0, 29.0, 33.0, 40.0, 53.0, 52.0, 0.0, 90.0, 65.0, 55.0, 77.0, 74.0, 68.0, 59.0, 0.0, 37.0, 34.0, 31.0, 27.0, 18.0, 17.0, 16.0, 0.0, 8.0, 11.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3187527656555176e-06, -1.2665987014770508e-06, -1.214444637298584e-06, -1.1622905731201172e-06, -1.1101365089416504e-06, -1.0579824447631836e-06, -1.0058283805847168e-06, -9.5367431640625e-07, -9.015202522277832e-07, -8.493661880493164e-07, -7.972121238708496e-07, -7.450580596923828e-07, -6.92903995513916e-07, -6.407499313354492e-07, -5.885958671569824e-07, -5.364418029785156e-07, -4.842877388000488e-07, -4.3213367462158203e-07, -3.7997961044311523e-07, -3.2782554626464844e-07, -2.7567148208618164e-07, -2.2351741790771484e-07, -1.7136335372924805e-07, -1.1920928955078125e-07, -6.705522537231445e-08, -1.4901161193847656e-08, 3.725290298461914e-08, 8.940696716308594e-08, 1.4156103134155273e-07, 1.9371509552001953e-07, 2.4586915969848633e-07, 2.980232238769531e-07, 3.501772880554199e-07, 4.023313522338867e-07, 4.544854164123535e-07, 5.066394805908203e-07, 5.587935447692871e-07, 6.109476089477539e-07, 6.631016731262207e-07, 7.152557373046875e-07, 7.674098014831543e-07, 8.195638656616211e-07, 8.717179298400879e-07, 9.238719940185547e-07, 9.760260581970215e-07, 1.0281801223754883e-06, 1.080334186553955e-06, 1.1324882507324219e-06, 1.1846423149108887e-06, 1.2367963790893555e-06, 1.2889504432678223e-06, 1.341104507446289e-06, 1.3932585716247559e-06, 1.4454126358032227e-06, 1.4975666999816895e-06, 1.5497207641601562e-06, 1.601874828338623e-06, 1.6540288925170898e-06, 1.7061829566955566e-06, 1.7583370208740234e-06, 1.8104910850524902e-06, 1.862645149230957e-06, 1.914799213409424e-06, 1.9669532775878906e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 7.0, 10.0, 18.0, 20.0, 22.0, 45.0, 55.0, 70.0, 84.0, 125.0, 148.0, 196.0, 266.0, 352.0, 532.0, 789.0, 1066.0, 1607.0, 3061.0, 6206.0, 15310.0, 42871.0, 151805.0, 605966.0, 146555.0, 41896.0, 14992.0, 6084.0, 2928.0, 1678.0, 1079.0, 741.0, 486.0, 382.0, 297.0, 221.0, 133.0, 112.0, 88.0, 50.0, 59.0, 39.0, 17.0, 23.0, 18.0, 8.0, 10.0, 6.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0003256797790527344, -0.00031565502285957336, -0.00030563026666641235, -0.00029560551047325134, -0.00028558075428009033, -0.0002755559980869293, -0.0002655312418937683, -0.0002555064857006073, -0.0002454817295074463, -0.00023545697331428528, -0.00022543221712112427, -0.00021540746092796326, -0.00020538270473480225, -0.00019535794854164124, -0.00018533319234848022, -0.00017530843615531921, -0.0001652836799621582, -0.0001552589237689972, -0.00014523416757583618, -0.00013520941138267517, -0.00012518465518951416, -0.00011515989899635315, -0.00010513514280319214, -9.511038661003113e-05, -8.508563041687012e-05, -7.50608742237091e-05, -6.50361180305481e-05, -5.5011361837387085e-05, -4.4986605644226074e-05, -3.4961849451065063e-05, -2.4937093257904053e-05, -1.4912337064743042e-05, -4.887580871582031e-06, 5.1371753215789795e-06, 1.516193151473999e-05, 2.5186687707901e-05, 3.521144390106201e-05, 4.523620009422302e-05, 5.526095628738403e-05, 6.528571248054504e-05, 7.531046867370605e-05, 8.533522486686707e-05, 9.535998106002808e-05, 0.00010538473725318909, 0.0001154094934463501, 0.0001254342496395111, 0.00013545900583267212, 0.00014548376202583313, 0.00015550851821899414, 0.00016553327441215515, 0.00017555803060531616, 0.00018558278679847717, 0.00019560754299163818, 0.0002056322991847992, 0.0002156570553779602, 0.00022568181157112122, 0.00023570656776428223, 0.00024573132395744324, 0.00025575608015060425, 0.00026578083634376526, 0.00027580559253692627, 0.0002858303487300873, 0.0002958551049232483, 0.0003058798611164093, 0.0003159046173095703]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 13.0, 22.0, 36.0, 51.0, 85.0, 120.0, 267.0, 147.0, 73.0, 69.0, 39.0, 17.0, 10.0, 12.0, 9.0, 0.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.98377799987793e-05, -9.667500853538513e-05, -9.351223707199097e-05, -9.03494656085968e-05, -8.718669414520264e-05, -8.402392268180847e-05, -8.08611512184143e-05, -7.769837975502014e-05, -7.453560829162598e-05, -7.137283682823181e-05, -6.821006536483765e-05, -6.504729390144348e-05, -6.188452243804932e-05, -5.872175097465515e-05, -5.5558979511260986e-05, -5.239620804786682e-05, -4.9233436584472656e-05, -4.607066512107849e-05, -4.2907893657684326e-05, -3.974512219429016e-05, -3.6582350730895996e-05, -3.341957926750183e-05, -3.0256807804107666e-05, -2.70940363407135e-05, -2.3931264877319336e-05, -2.076849341392517e-05, -1.7605721950531006e-05, -1.444295048713684e-05, -1.1280179023742676e-05, -8.11740756034851e-06, -4.954636096954346e-06, -1.7918646335601807e-06, 1.3709068298339844e-06, 4.533678293228149e-06, 7.696449756622314e-06, 1.085922122001648e-05, 1.4021992683410645e-05, 1.718476414680481e-05, 2.0347535610198975e-05, 2.351030707359314e-05, 2.6673078536987305e-05, 2.983585000038147e-05, 3.2998621463775635e-05, 3.61613929271698e-05, 3.9324164390563965e-05, 4.248693585395813e-05, 4.5649707317352295e-05, 4.881247878074646e-05, 5.1975250244140625e-05, 5.513802170753479e-05, 5.8300793170928955e-05, 6.146356463432312e-05, 6.462633609771729e-05, 6.778910756111145e-05, 7.095187902450562e-05, 7.411465048789978e-05, 7.727742195129395e-05, 8.044019341468811e-05, 8.360296487808228e-05, 8.676573634147644e-05, 8.99285078048706e-05, 9.309127926826477e-05, 9.625405073165894e-05, 9.94168221950531e-05, 0.00010257959365844727]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 7.0, 14.0, 21.0, 17.0, 21.0, 23.0, 25.0, 36.0, 35.0, 72.0, 71.0, 74.0, 79.0, 72.0, 74.0, 74.0, 62.0, 39.0, 29.0, 27.0, 22.0, 15.0, 15.0, 15.0, 4.0, 5.0, 6.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003041747724637389, -0.0029391516000032425, -0.0028365557081997395, -0.0027339595835655928, -0.0026313636917620897, -0.002528767567127943, -0.00242617167532444, -0.0023235755506902933, -0.0022209796588867903, -0.0021183835342526436, -0.0020157876424491405, -0.0019131916342303157, -0.0018105956260114908, -0.0017079995013773441, -0.001605403609573841, -0.0015028074849396944, -0.0014002114767208695, -0.0012976154685020447, -0.0011950194602832198, -0.001092423452064395, -0.00098982744384557, -0.0008872313774190843, -0.0007846353692002594, -0.0006820393609814346, -0.0005794433527626097, -0.00047684734454378486, -0.00037425133632496, -0.0002716552990023047, -0.0001690592907834798, -6.646325346082449e-05, 3.6132754758000374e-05, 0.00013872876297682524, 0.0002413247711956501, 0.00034392077941447496, 0.00044651678763329983, 0.0005491127958521247, 0.0006517088040709496, 0.0007543048704974353, 0.0008569008787162602, 0.0009594968869350851, 0.001062092836946249, 0.0011646888451650739, 0.0012672848533838987, 0.0013698808616027236, 0.0014724768698215485, 0.0015750729944556952, 0.0016776688862591982, 0.0017802650108933449, 0.0018828610191121697, 0.0019854570273309946, 0.0020880531519651413, 0.0021906490437686443, 0.002293245168402791, 0.002395841060206294, 0.0024984371848404408, 0.002601033076643944, 0.0027036292012780905, 0.002806225325912237, 0.00290882121771574, 0.003011417342349887, 0.00311401323415339, 0.0032166093587875366, 0.0033192052505910397, 0.0034218013752251863, 0.0035243972670286894]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 4.0, 6.0, 7.0, 7.0, 16.0, 15.0, 14.0, 10.0, 18.0, 30.0, 27.0, 21.0, 27.0, 29.0, 37.0, 36.0, 41.0, 32.0, 42.0, 39.0, 40.0, 32.0, 44.0, 46.0, 38.0, 41.0, 39.0, 31.0, 36.0, 22.0, 21.0, 24.0, 18.0, 12.0, 19.0, 9.0, 11.0, 14.0, 7.0, 5.0, 13.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0019394051050767303, -0.0018766878638416529, -0.0018139707390218973, -0.00175125349778682, -0.0016885362565517426, -0.001625819131731987, -0.0015631018904969096, -0.0015003846492618322, -0.0014376675244420767, -0.0013749502832069993, -0.0013122331583872437, -0.0012495159171521664, -0.001186798675917089, -0.0011240814346820116, -0.001061364309862256, -0.0009986470686271787, -0.0009359298273921013, -0.0008732126443646848, -0.0008104954031296074, -0.000747778220102191, -0.0006850609788671136, -0.0006223437958396971, -0.0005596266128122807, -0.0004969093715772033, -0.0004341921885497868, -0.0003714749764185399, -0.00030875776428729296, -0.0002460405812598765, -0.00018332336912862957, -0.00012060615699738264, -5.788897396996617e-05, 4.828238161280751e-06, 6.75455667078495e-05, 0.00013026277883909643, 0.00019297997641842812, 0.0002556971739977598, 0.00031841438612900674, 0.00038113159826025367, 0.00044384878128767014, 0.0005065660225227475, 0.000569283205550164, 0.0006320003885775805, 0.0006947176298126578, 0.0007574348128400743, 0.0008201519958674908, 0.0008828692371025681, 0.0009455864201299846, 0.001008303603157401, 0.0010710208443924785, 0.0011337380856275558, 0.0011964552104473114, 0.0012591724516823888, 0.0013218896929174662, 0.0013846068177372217, 0.001447324058972299, 0.0015100413002073765, 0.001572758425027132, 0.0016354756662622094, 0.001698192791081965, 0.0017609100323170424, 0.0018236272735521197, 0.0018863445147871971, 0.0019490616396069527, 0.0020117787644267082, 0.0020744961220771074]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 5.0, 16.0, 25.0, 33.0, 47.0, 64.0, 75.0, 113.0, 169.0, 268.0, 388.0, 542.0, 754.0, 1236.0, 1759.0, 2686.0, 4105.0, 6355.0, 9930.0, 15764.0, 25688.0, 42731.0, 72854.0, 125446.0, 196854.0, 206690.0, 134757.0, 78644.0, 45652.0, 27586.0, 16761.0, 10707.0, 6820.0, 4355.0, 2907.0, 1894.0, 1200.0, 820.0, 573.0, 424.0, 257.0, 188.0, 130.0, 80.0, 69.0, 36.0, 40.0, 13.0, 11.0, 13.0, 8.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.004360198974609375, -0.004224240779876709, -0.004088282585144043, -0.003952324390411377, -0.003816366195678711, -0.003680408000946045, -0.003544449806213379, -0.003408491611480713, -0.003272533416748047, -0.003136575222015381, -0.003000617027282715, -0.002864658832550049, -0.002728700637817383, -0.002592742443084717, -0.0024567842483520508, -0.0023208260536193848, -0.0021848678588867188, -0.0020489096641540527, -0.0019129514694213867, -0.0017769932746887207, -0.0016410350799560547, -0.0015050768852233887, -0.0013691186904907227, -0.0012331604957580566, -0.0010972023010253906, -0.0009612441062927246, -0.0008252859115600586, -0.0006893277168273926, -0.0005533695220947266, -0.00041741132736206055, -0.00028145313262939453, -0.00014549493789672852, -9.5367431640625e-06, 0.00012642145156860352, 0.00026237964630126953, 0.00039833784103393555, 0.0005342960357666016, 0.0006702542304992676, 0.0008062124252319336, 0.0009421706199645996, 0.0010781288146972656, 0.0012140870094299316, 0.0013500452041625977, 0.0014860033988952637, 0.0016219615936279297, 0.0017579197883605957, 0.0018938779830932617, 0.0020298361778259277, 0.0021657943725585938, 0.0023017525672912598, 0.0024377107620239258, 0.002573668956756592, 0.002709627151489258, 0.002845585346221924, 0.00298154354095459, 0.003117501735687256, 0.003253459930419922, 0.003389418125152588, 0.003525376319885254, 0.00366133451461792, 0.003797292709350586, 0.003933250904083252, 0.004069209098815918, 0.004205167293548584, 0.00434112548828125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 9.0, 5.0, 15.0, 14.0, 19.0, 11.0, 20.0, 24.0, 19.0, 26.0, 28.0, 35.0, 39.0, 38.0, 23.0, 49.0, 36.0, 43.0, 47.0, 46.0, 40.0, 33.0, 53.0, 45.0, 43.0, 41.0, 20.0, 25.0, 16.0, 17.0, 18.0, 14.0, 17.0, 9.0, 15.0, 6.0, 7.0, 7.0, 8.0, 6.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0018968582153320312, -0.0018335431814193726, -0.0017702281475067139, -0.0017069131135940552, -0.0016435980796813965, -0.0015802830457687378, -0.001516968011856079, -0.0014536529779434204, -0.0013903379440307617, -0.001327022910118103, -0.0012637078762054443, -0.0012003928422927856, -0.001137077808380127, -0.0010737627744674683, -0.0010104477405548096, -0.0009471327066421509, -0.0008838176727294922, -0.0008205026388168335, -0.0007571876049041748, -0.0006938725709915161, -0.0006305575370788574, -0.0005672425031661987, -0.00050392746925354, -0.00044061243534088135, -0.00037729740142822266, -0.00031398236751556396, -0.0002506673336029053, -0.00018735229969024658, -0.0001240372657775879, -6.07222318649292e-05, 2.592802047729492e-06, 6.590783596038818e-05, 0.00012922286987304688, 0.00019253790378570557, 0.00025585293769836426, 0.00031916797161102295, 0.00038248300552368164, 0.00044579803943634033, 0.000509113073348999, 0.0005724281072616577, 0.0006357431411743164, 0.0006990581750869751, 0.0007623732089996338, 0.0008256882429122925, 0.0008890032768249512, 0.0009523183107376099, 0.0010156333446502686, 0.0010789483785629272, 0.001142263412475586, 0.0012055784463882446, 0.0012688934803009033, 0.001332208514213562, 0.0013955235481262207, 0.0014588385820388794, 0.001522153615951538, 0.0015854686498641968, 0.0016487836837768555, 0.0017120987176895142, 0.0017754137516021729, 0.0018387287855148315, 0.0019020438194274902, 0.001965358853340149, 0.0020286738872528076, 0.0020919889211654663, 0.002155303955078125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 20.0, 24.0, 23.0, 45.0, 57.0, 97.0, 126.0, 185.0, 287.0, 396.0, 561.0, 785.0, 1198.0, 1616.0, 2512.0, 3720.0, 5548.0, 8678.0, 13637.0, 21082.0, 34192.0, 56078.0, 94931.0, 156257.0, 218712.0, 166781.0, 100045.0, 60147.0, 36253.0, 22670.0, 14281.0, 9113.0, 6056.0, 4034.0, 2723.0, 1776.0, 1221.0, 846.0, 545.0, 393.0, 274.0, 192.0, 137.0, 87.0, 64.0, 46.0, 31.0, 20.0, 21.0, 11.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0], "bins": [-0.004405975341796875, -0.004270672798156738, -0.0041353702545166016, -0.004000067710876465, -0.003864765167236328, -0.0037294626235961914, -0.0035941600799560547, -0.003458857536315918, -0.0033235549926757812, -0.0031882524490356445, -0.003052949905395508, -0.002917647361755371, -0.0027823448181152344, -0.0026470422744750977, -0.002511739730834961, -0.0023764371871948242, -0.0022411346435546875, -0.0021058320999145508, -0.001970529556274414, -0.0018352270126342773, -0.0016999244689941406, -0.001564621925354004, -0.0014293193817138672, -0.0012940168380737305, -0.0011587142944335938, -0.001023411750793457, -0.0008881092071533203, -0.0007528066635131836, -0.0006175041198730469, -0.00048220157623291016, -0.00034689903259277344, -0.00021159648895263672, -7.62939453125e-05, 5.900859832763672e-05, 0.00019431114196777344, 0.00032961368560791016, 0.0004649162292480469, 0.0006002187728881836, 0.0007355213165283203, 0.000870823860168457, 0.0010061264038085938, 0.0011414289474487305, 0.0012767314910888672, 0.001412034034729004, 0.0015473365783691406, 0.0016826391220092773, 0.001817941665649414, 0.0019532442092895508, 0.0020885467529296875, 0.0022238492965698242, 0.002359151840209961, 0.0024944543838500977, 0.0026297569274902344, 0.002765059471130371, 0.002900362014770508, 0.0030356645584106445, 0.0031709671020507812, 0.003306269645690918, 0.0034415721893310547, 0.0035768747329711914, 0.003712177276611328, 0.003847479820251465, 0.0039827823638916016, 0.004118084907531738, 0.004253387451171875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 3.0, 7.0, 5.0, 3.0, 13.0, 6.0, 14.0, 9.0, 10.0, 20.0, 17.0, 20.0, 35.0, 38.0, 44.0, 33.0, 44.0, 46.0, 44.0, 50.0, 41.0, 49.0, 39.0, 32.0, 43.0, 40.0, 41.0, 28.0, 33.0, 20.0, 27.0, 17.0, 21.0, 17.0, 14.0, 13.0, 13.0, 7.0, 8.0, 8.0, 8.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012731552124023438, -0.0012330859899520874, -0.001193016767501831, -0.0011529475450515747, -0.0011128783226013184, -0.001072809100151062, -0.0010327398777008057, -0.0009926706552505493, -0.000952601432800293, -0.0009125322103500366, -0.0008724629878997803, -0.0008323937654495239, -0.0007923245429992676, -0.0007522553205490112, -0.0007121860980987549, -0.0006721168756484985, -0.0006320476531982422, -0.0005919784307479858, -0.0005519092082977295, -0.0005118399858474731, -0.0004717707633972168, -0.00043170154094696045, -0.0003916323184967041, -0.00035156309604644775, -0.0003114938735961914, -0.00027142465114593506, -0.0002313554286956787, -0.00019128620624542236, -0.00015121698379516602, -0.00011114776134490967, -7.107853889465332e-05, -3.100931644439697e-05, 9.059906005859375e-06, 4.912912845611572e-05, 8.919835090637207e-05, 0.00012926757335662842, 0.00016933679580688477, 0.0002094060182571411, 0.00024947524070739746, 0.0002895444631576538, 0.00032961368560791016, 0.0003696829080581665, 0.00040975213050842285, 0.0004498213529586792, 0.0004898905754089355, 0.0005299597978591919, 0.0005700290203094482, 0.0006100982427597046, 0.0006501674652099609, 0.0006902366876602173, 0.0007303059101104736, 0.00077037513256073, 0.0008104443550109863, 0.0008505135774612427, 0.000890582799911499, 0.0009306520223617554, 0.0009707212448120117, 0.001010790467262268, 0.0010508596897125244, 0.0010909289121627808, 0.0011309981346130371, 0.0011710673570632935, 0.0012111365795135498, 0.0012512058019638062, 0.0012912750244140625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 12.0, 18.0, 25.0, 33.0, 53.0, 57.0, 84.0, 128.0, 195.0, 312.0, 459.0, 693.0, 1011.0, 1553.0, 2595.0, 4346.0, 7767.0, 16104.0, 39927.0, 156192.0, 631105.0, 119543.0, 34042.0, 14296.0, 7151.0, 3997.0, 2385.0, 1551.0, 999.0, 630.0, 421.0, 257.0, 198.0, 129.0, 91.0, 56.0, 53.0, 29.0, 17.0, 10.0, 10.0, 7.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0025196075439453125, -0.002446413040161133, -0.002373218536376953, -0.0023000240325927734, -0.0022268295288085938, -0.002153635025024414, -0.0020804405212402344, -0.0020072460174560547, -0.001934051513671875, -0.0018608570098876953, -0.0017876625061035156, -0.001714468002319336, -0.0016412734985351562, -0.0015680789947509766, -0.0014948844909667969, -0.0014216899871826172, -0.0013484954833984375, -0.0012753009796142578, -0.0012021064758300781, -0.0011289119720458984, -0.0010557174682617188, -0.000982522964477539, -0.0009093284606933594, -0.0008361339569091797, -0.000762939453125, -0.0006897449493408203, -0.0006165504455566406, -0.0005433559417724609, -0.00047016143798828125, -0.00039696693420410156, -0.0003237724304199219, -0.0002505779266357422, -0.0001773834228515625, -0.00010418891906738281, -3.0994415283203125e-05, 4.220008850097656e-05, 0.00011539459228515625, 0.00018858909606933594, 0.0002617835998535156, 0.0003349781036376953, 0.000408172607421875, 0.0004813671112060547, 0.0005545616149902344, 0.0006277561187744141, 0.0007009506225585938, 0.0007741451263427734, 0.0008473396301269531, 0.0009205341339111328, 0.0009937286376953125, 0.0010669231414794922, 0.0011401176452636719, 0.0012133121490478516, 0.0012865066528320312, 0.001359701156616211, 0.0014328956604003906, 0.0015060901641845703, 0.00157928466796875, 0.0016524791717529297, 0.0017256736755371094, 0.001798868179321289, 0.0018720626831054688, 0.0019452571868896484, 0.002018451690673828, 0.002091646194458008, 0.0021648406982421875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 38.0, 0.0, 0.0, 90.0, 0.0, 0.0, 104.0, 0.0, 0.0, 141.0, 0.0, 0.0, 0.0, 166.0, 0.0, 0.0, 153.0, 0.0, 0.0, 110.0, 0.0, 0.0, 91.0, 0.0, 0.0, 50.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 16.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 10.0, 8.0, 21.0, 21.0, 34.0, 48.0, 65.0, 90.0, 118.0, 153.0, 221.0, 350.0, 524.0, 711.0, 998.0, 1485.0, 2083.0, 3089.0, 4772.0, 7995.0, 14673.0, 32868.0, 98419.0, 613869.0, 174279.0, 45920.0, 18858.0, 9814.0, 5683.0, 3541.0, 2332.0, 1688.0, 1086.0, 803.0, 557.0, 380.0, 289.0, 198.0, 144.0, 97.0, 78.0, 49.0, 39.0, 21.0, 18.0, 14.0, 12.0, 11.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0], "bins": [-0.002513885498046875, -0.0024392306804656982, -0.0023645758628845215, -0.0022899210453033447, -0.002215266227722168, -0.002140611410140991, -0.0020659565925598145, -0.0019913017749786377, -0.001916646957397461, -0.0018419921398162842, -0.0017673373222351074, -0.0016926825046539307, -0.001618027687072754, -0.0015433728694915771, -0.0014687180519104004, -0.0013940632343292236, -0.0013194084167480469, -0.0012447535991668701, -0.0011700987815856934, -0.0010954439640045166, -0.0010207891464233398, -0.0009461343288421631, -0.0008714795112609863, -0.0007968246936798096, -0.0007221698760986328, -0.0006475150585174561, -0.0005728602409362793, -0.0004982054233551025, -0.0004235506057739258, -0.000348895788192749, -0.00027424097061157227, -0.0001995861530303955, -0.00012493133544921875, -5.027651786804199e-05, 2.4378299713134766e-05, 9.903311729431152e-05, 0.00017368793487548828, 0.00024834275245666504, 0.0003229975700378418, 0.00039765238761901855, 0.0004723072052001953, 0.0005469620227813721, 0.0006216168403625488, 0.0006962716579437256, 0.0007709264755249023, 0.0008455812931060791, 0.0009202361106872559, 0.0009948909282684326, 0.0010695457458496094, 0.0011442005634307861, 0.0012188553810119629, 0.0012935101985931396, 0.0013681650161743164, 0.0014428198337554932, 0.00151747465133667, 0.0015921294689178467, 0.0016667842864990234, 0.0017414391040802002, 0.001816093921661377, 0.0018907487392425537, 0.0019654035568237305, 0.0020400583744049072, 0.002114713191986084, 0.0021893680095672607, 0.0022640228271484375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 3.0, 7.0, 5.0, 6.0, 10.0, 8.0, 21.0, 24.0, 33.0, 58.0, 67.0, 105.0, 142.0, 129.0, 103.0, 76.0, 40.0, 41.0, 26.0, 19.0, 9.0, 11.0, 5.0, 10.0, 1.0, 4.0, 5.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007004737854003906, -0.00067930668592453, -0.0006581395864486694, -0.0006369724869728088, -0.0006158053874969482, -0.0005946382880210876, -0.000573471188545227, -0.0005523040890693665, -0.0005311369895935059, -0.0005099698901176453, -0.0004888027906417847, -0.00046763569116592407, -0.0004464685916900635, -0.0004253014922142029, -0.0004041343927383423, -0.0003829672932624817, -0.0003618001937866211, -0.0003406330943107605, -0.0003194659948348999, -0.0002982988953590393, -0.0002771317958831787, -0.0002559646964073181, -0.00023479759693145752, -0.00021363049745559692, -0.00019246339797973633, -0.00017129629850387573, -0.00015012919902801514, -0.00012896209955215454, -0.00010779500007629395, -8.662790060043335e-05, -6.546080112457275e-05, -4.429370164871216e-05, -2.3126602172851562e-05, -1.959502696990967e-06, 1.920759677886963e-05, 4.0374696254730225e-05, 6.154179573059082e-05, 8.270889520645142e-05, 0.00010387599468231201, 0.0001250430941581726, 0.0001462101936340332, 0.0001673772931098938, 0.0001885443925857544, 0.000209711492061615, 0.00023087859153747559, 0.0002520456910133362, 0.0002732127904891968, 0.0002943798899650574, 0.00031554698944091797, 0.00033671408891677856, 0.00035788118839263916, 0.00037904828786849976, 0.00040021538734436035, 0.00042138248682022095, 0.00044254958629608154, 0.00046371668577194214, 0.00048488378524780273, 0.0005060508847236633, 0.0005272179841995239, 0.0005483850836753845, 0.0005695521831512451, 0.0005907192826271057, 0.0006118863821029663, 0.0006330534815788269, 0.0006542205810546875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 5.0, 6.0, 3.0, 15.0, 13.0, 21.0, 19.0, 20.0, 16.0, 37.0, 29.0, 32.0, 40.0, 60.0, 71.0, 54.0, 78.0, 72.0, 74.0, 47.0, 39.0, 38.0, 33.0, 25.0, 26.0, 25.0, 17.0, 9.0, 9.0, 9.0, 8.0, 14.0, 5.0, 4.0, 6.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0031117377802729607, -0.0030121023301035166, -0.0029124668799340725, -0.0028128311969339848, -0.0027131957467645407, -0.0026135602965950966, -0.0025139248464256525, -0.0024142893962562084, -0.0023146537132561207, -0.0022150182630866766, -0.0021153828129172325, -0.0020157471299171448, -0.0019161116797477007, -0.0018164762295782566, -0.0017168407794088125, -0.0016172053292393684, -0.0015175698790699244, -0.0014179344289004803, -0.0013182988623157144, -0.0012186634121462703, -0.0011190278455615044, -0.0010193923953920603, -0.0009197569452226162, -0.0008201214368455112, -0.0007204859284684062, -0.0006208504200913012, -0.0005212149117141962, -0.0004215794615447521, -0.0003219439531676471, -0.00022230844479054213, -0.00012267299462109804, -2.3037486243993044e-05, 7.659825496375561e-05, 0.00017623374878894538, 0.00027586924261413515, 0.0003755047218874097, 0.0004751402302645147, 0.0005747757386416197, 0.0006744111888110638, 0.0007740466971881688, 0.0008736822055652738, 0.0009733177139423788, 0.0010729532223194838, 0.0011725886724889278, 0.001272224122658372, 0.0013718596892431378, 0.001471495139412582, 0.0015711307059973478, 0.001670766156166792, 0.001770401606336236, 0.001870037172921002, 0.001969672739505768, 0.002069308189675212, 0.002168943639844656, 0.0022685790900141, 0.002368214540183544, 0.002467850223183632, 0.002567485673353076, 0.00266712112352252, 0.002766756806522608, 0.002866392256692052, 0.002966027706861496, 0.00306566315703094, 0.003165298607200384, 0.0032649340573698282]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 12.0, 8.0, 7.0, 14.0, 10.0, 25.0, 15.0, 28.0, 28.0, 34.0, 31.0, 33.0, 23.0, 30.0, 31.0, 42.0, 47.0, 43.0, 60.0, 39.0, 41.0, 38.0, 30.0, 35.0, 32.0, 34.0, 24.0, 24.0, 25.0, 21.0, 28.0, 17.0, 16.0, 8.0, 9.0, 12.0, 6.0, 10.0, 8.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.002139362273737788, -0.0020688376389443874, -0.0019983130041509867, -0.0019277884857729077, -0.001857263850979507, -0.0017867392161861062, -0.0017162146978080273, -0.0016456900630146265, -0.0015751654282212257, -0.001504640793427825, -0.0014341161586344242, -0.0013635916402563453, -0.0012930670054629445, -0.0012225423706695437, -0.0011520178522914648, -0.001081493217498064, -0.0010109685827046633, -0.0009404439479112625, -0.0008699193713255227, -0.0007993947947397828, -0.000728870159946382, -0.0006583455251529813, -0.0005878209485672414, -0.0005172963719815016, -0.0004467717371881008, -0.0003762471314985305, -0.0003057225258089602, -0.0002351979201193899, -0.00016467331442981958, -9.414870874024928e-05, -2.362410305067897e-05, 4.690047353506088e-05, 0.0001174253411591053, 0.0001879499468486756, 0.0002584745525382459, 0.0003289991582278162, 0.00039952376391738653, 0.00047004836960695684, 0.0005405729752965271, 0.000611097551882267, 0.0006816221866756678, 0.0007521468214690685, 0.0008226713980548084, 0.0008931959746405482, 0.000963720609433949, 0.0010342452442273498, 0.0011047697626054287, 0.0011752943973988295, 0.0012458190321922302, 0.001316343666985631, 0.0013868683017790318, 0.0014573928201571107, 0.0015279174549505115, 0.0015984420897439122, 0.0016689666081219912, 0.001739491242915392, 0.0018100158777087927, 0.0018805405125021935, 0.0019510651472955942, 0.002021589782088995, 0.002092114184051752, 0.002162638818845153, 0.0022331634536385536, 0.0023036880884319544, 0.002374212723225355]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 5.0, 3.0, 4.0, 4.0, 8.0, 11.0, 14.0, 20.0, 16.0, 26.0, 26.0, 34.0, 42.0, 45.0, 45.0, 55.0, 68.0, 68.0, 92.0, 123.0, 212.0, 421.0, 1239.0, 517950.0, 1980.0, 676.0, 279.0, 154.0, 87.0, 68.0, 72.0, 74.0, 51.0, 51.0, 50.0, 32.0, 31.0, 25.0, 14.0, 18.0, 15.0, 6.0, 12.0, 7.0, 8.0, 6.0, 3.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0600602887570858, -0.058167267590761185, -0.05627424642443657, -0.054381225258111954, -0.05248820036649704, -0.050595179200172424, -0.04870215803384781, -0.04680913686752319, -0.04491611570119858, -0.04302309453487396, -0.04113007336854935, -0.03923705220222473, -0.037344031035900116, -0.0354510098695755, -0.03355798497796059, -0.03166496381163597, -0.029771942645311356, -0.02787892147898674, -0.025985900312662125, -0.02409287728369236, -0.022199856117367744, -0.02030683495104313, -0.018413811922073364, -0.01652079075574875, -0.014627769589424133, -0.012734748423099518, -0.010841726325452328, -0.008948704227805138, -0.007055683061480522, -0.005162661895155907, -0.0032696397975087166, -0.0013766176998615265, 0.0005164071917533875, 0.0024094288237392902, 0.004302450455725193, 0.006195472087711096, 0.008088493719696999, 0.009981514886021614, 0.011874536983668804, 0.013767559081315994, 0.01566058024764061, 0.017553601413965225, 0.01944662258028984, 0.021339645609259605, 0.02323266677558422, 0.025125687941908836, 0.0270187109708786, 0.028911732137203217, 0.030804753303527832, 0.03269777446985245, 0.03459079563617706, 0.03648381680250168, 0.038376837968826294, 0.04026985913515091, 0.04216288402676582, 0.04405590519309044, 0.045948926359415054, 0.04784194752573967, 0.049734968692064285, 0.0516279898583889, 0.053521014750003815, 0.05541403591632843, 0.057307057082653046, 0.05920007824897766, 0.06109309941530228]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 8.0, 11.0, 13.0, 11.0, 9.0, 24.0, 20.0, 24.0, 29.0, 25.0, 40.0, 32.0, 30.0, 26.0, 36.0, 43.0, 49.0, 53.0, 1070.0, 48.0, 39.0, 39.0, 32.0, 30.0, 30.0, 31.0, 29.0, 20.0, 29.0, 20.0, 23.0, 21.0, 7.0, 9.0, 12.0, 13.0, 7.0, 6.0, 5.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06292717158794403, -0.06084686145186424, -0.058766547590494156, -0.05668623745441437, -0.05460592359304428, -0.05252561345696449, -0.050445303320884705, -0.04836498945951462, -0.04628467932343483, -0.04420436918735504, -0.042124055325984955, -0.04004374518990517, -0.03796343505382538, -0.03588312119245529, -0.033802811056375504, -0.031722500920295715, -0.02964218705892563, -0.02756187506020069, -0.025481563061475754, -0.023401252925395966, -0.021320940926671028, -0.01924062892794609, -0.017160318791866302, -0.015080006793141365, -0.012999694794416428, -0.01091938279569149, -0.008839071728289127, -0.006758760195225477, -0.004678448662161827, -0.0025981366634368896, -0.0005178255960345268, 0.001562485471367836, 0.0036427974700927734, 0.005723109003156424, 0.007803420536220074, 0.009883731603622437, 0.011964043602347374, 0.014044355601072311, 0.0161246657371521, 0.018204977735877037, 0.020285289734601974, 0.022365601733326912, 0.02444591373205185, 0.026526223868131638, 0.028606535866856575, 0.030686847865581512, 0.0327671580016613, 0.03484746813774109, 0.036927781999111176, 0.039008092135190964, 0.04108840599656105, 0.04316871613264084, 0.045249029994010925, 0.047329340130090714, 0.0494096502661705, 0.05148996412754059, 0.05357027426362038, 0.055650584399700165, 0.05773089826107025, 0.05981120839715004, 0.06189151853322983, 0.06397183239459991, 0.06605214625597, 0.06813245266675949, 0.07021276652812958]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 8.0, 6.0, 7.0, 7.0, 5.0, 8.0, 8.0, 10.0, 11.0, 24.0, 32.0, 26.0, 67.0, 91.0, 139.0, 158.0, 229.0, 310.0, 484.0, 562.0, 684.0, 730.0, 826.0, 1078.0, 1752.0, 4284.0, 31200018.0, 24526.0, 5359.0, 10877.0, 1088.0, 247.0, 140.0, 104.0, 148.0, 178.0, 235.0, 8.0, 5.0], "bins": [-14480.0, -14200.5625, -13921.125, -13641.6875, -13362.25, -13082.8125, -12803.375, -12523.9375, -12244.5, -11965.0625, -11685.625, -11406.1875, -11126.75, -10847.3125, -10567.875, -10288.4375, -10009.0, -9729.5625, -9450.125, -9170.6875, -8891.25, -8611.8125, -8332.375, -8052.9375, -7773.5, -7494.0625, -7214.625, -6935.1875, -6655.75, -6376.3125, -6096.875, -5817.4375, -5538.0, -5258.5625, -4979.125, -4699.6875, -4420.25, -4140.8125, -3861.375, -3581.9375, -3302.5, -3023.0625, -2743.625, -2464.1875, -2184.75, -1905.3125, -1625.875, -1346.4375, -1067.0, -787.5625, -508.125, -228.6875, 50.75, 330.1875, 609.625, 889.0625, 1168.5, 1447.9375, 1727.375, 2006.8125, 2286.25, 2565.6875, 2845.125, 3124.5625, 3404.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 6.0, 9.0, 11.0, 14.0, 23.0, 33.0, 36.0, 56.0, 103.0, 142.0, 250.0, 256.0, 413.0, 484.0, 849.0, 1240.0, 1695.0, 2458.0, 3887.0, 6366.0, 9812.0, 16270.0, 28316.0, 52156.0, 102137.0, 219040.0, 560842.0, 3521326.0, 1110794.0, 338498.0, 147054.0, 72400.0, 38285.0, 21191.0, 12576.0, 7878.0, 4856.0, 3072.0, 2080.0, 1392.0, 988.0, 658.0, 435.0, 271.0, 205.0, 170.0, 119.0, 82.0, 57.0, 46.0, 36.0, 18.0, 11.0, 11.0, 7.0, 11.0, 5.0], "bins": [-30.1875, -29.319091796875, -28.45068359375, -27.582275390625, -26.7138671875, -25.845458984375, -24.97705078125, -24.108642578125, -23.240234375, -22.371826171875, -21.50341796875, -20.635009765625, -19.7666015625, -18.898193359375, -18.02978515625, -17.161376953125, -16.29296875, -15.424560546875, -14.55615234375, -13.687744140625, -12.8193359375, -11.950927734375, -11.08251953125, -10.214111328125, -9.345703125, -8.477294921875, -7.60888671875, -6.740478515625, -5.8720703125, -5.003662109375, -4.13525390625, -3.266845703125, -2.3984375, -1.530029296875, -0.66162109375, 0.206787109375, 1.0751953125, 1.943603515625, 2.81201171875, 3.680419921875, 4.548828125, 5.417236328125, 6.28564453125, 7.154052734375, 8.0224609375, 8.890869140625, 9.75927734375, 10.627685546875, 11.49609375, 12.364501953125, 13.23291015625, 14.101318359375, 14.9697265625, 15.838134765625, 16.70654296875, 17.574951171875, 18.443359375, 19.311767578125, 20.18017578125, 21.048583984375, 21.9169921875, 22.785400390625, 23.65380859375, 24.522216796875, 25.390625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 10.0, 6.0, 5.0, 12.0, 13.0, 12.0, 20.0, 25.0, 26.0, 22.0, 33.0, 27.0, 41.0, 33.0, 33.0, 51.0, 41.0, 77.0, 463.0, 352.0, 175.0, 95.0, 71.0, 69.0, 51.0, 55.0, 30.0, 23.0, 25.0, 20.0, 21.0, 13.0, 13.0, 16.0, 12.0, 9.0, 6.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.53125, -41.1435546875, -39.755859375, -38.3681640625, -36.98046875, -35.5927734375, -34.205078125, -32.8173828125, -31.4296875, -30.0419921875, -28.654296875, -27.2666015625, -25.87890625, -24.4912109375, -23.103515625, -21.7158203125, -20.328125, -18.9404296875, -17.552734375, -16.1650390625, -14.77734375, -13.3896484375, -12.001953125, -10.6142578125, -9.2265625, -7.8388671875, -6.451171875, -5.0634765625, -3.67578125, -2.2880859375, -0.900390625, 0.4873046875, 1.875, 3.2626953125, 4.650390625, 6.0380859375, 7.42578125, 8.8134765625, 10.201171875, 11.5888671875, 12.9765625, 14.3642578125, 15.751953125, 17.1396484375, 18.52734375, 19.9150390625, 21.302734375, 22.6904296875, 24.078125, 25.4658203125, 26.853515625, 28.2412109375, 29.62890625, 31.0166015625, 32.404296875, 33.7919921875, 35.1796875, 36.5673828125, 37.955078125, 39.3427734375, 40.73046875, 42.1181640625, 43.505859375, 44.8935546875, 46.28125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 0.0, 0.0, 3.0, 12.0, 13.0, 19.0, 10.0, 25.0, 43.0, 68.0, 61.0, 118.0, 171.0, 228.0, 300.0, 469.0, 742.0, 1167.0, 1730.0, 2849.0, 4922.0, 9025.0, 17520.0, 37802.0, 100154.0, 356685.0, 4214652.0, 1197955.0, 216706.0, 68464.0, 28081.0, 13391.0, 7270.0, 4220.0, 2309.0, 1467.0, 933.0, 609.0, 393.0, 263.0, 196.0, 140.0, 63.0, 70.0, 36.0, 23.0, 22.0, 18.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-56.65625, -54.9296875, -53.203125, -51.4765625, -49.75, -48.0234375, -46.296875, -44.5703125, -42.84375, -41.1171875, -39.390625, -37.6640625, -35.9375, -34.2109375, -32.484375, -30.7578125, -29.03125, -27.3046875, -25.578125, -23.8515625, -22.125, -20.3984375, -18.671875, -16.9453125, -15.21875, -13.4921875, -11.765625, -10.0390625, -8.3125, -6.5859375, -4.859375, -3.1328125, -1.40625, 0.3203125, 2.046875, 3.7734375, 5.5, 7.2265625, 8.953125, 10.6796875, 12.40625, 14.1328125, 15.859375, 17.5859375, 19.3125, 21.0390625, 22.765625, 24.4921875, 26.21875, 27.9453125, 29.671875, 31.3984375, 33.125, 34.8515625, 36.578125, 38.3046875, 40.03125, 41.7578125, 43.484375, 45.2109375, 46.9375, 48.6640625, 50.390625, 52.1171875, 53.84375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 9.0, 12.0, 14.0, 21.0, 20.0, 30.0, 35.0, 50.0, 46.0, 52.0, 52.0, 58.0, 88.0, 723.0, 321.0, 117.0, 64.0, 55.0, 43.0, 34.0, 38.0, 20.0, 19.0, 16.0, 11.0, 11.0, 14.0, 7.0, 6.0, 6.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.625, -82.9970703125, -80.369140625, -77.7412109375, -75.11328125, -72.4853515625, -69.857421875, -67.2294921875, -64.6015625, -61.9736328125, -59.345703125, -56.7177734375, -54.08984375, -51.4619140625, -48.833984375, -46.2060546875, -43.578125, -40.9501953125, -38.322265625, -35.6943359375, -33.06640625, -30.4384765625, -27.810546875, -25.1826171875, -22.5546875, -19.9267578125, -17.298828125, -14.6708984375, -12.04296875, -9.4150390625, -6.787109375, -4.1591796875, -1.53125, 1.0966796875, 3.724609375, 6.3525390625, 8.98046875, 11.6083984375, 14.236328125, 16.8642578125, 19.4921875, 22.1201171875, 24.748046875, 27.3759765625, 30.00390625, 32.6318359375, 35.259765625, 37.8876953125, 40.515625, 43.1435546875, 45.771484375, 48.3994140625, 51.02734375, 53.6552734375, 56.283203125, 58.9111328125, 61.5390625, 64.1669921875, 66.794921875, 69.4228515625, 72.05078125, 74.6787109375, 77.306640625, 79.9345703125, 82.5625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 4.0, 4.0, 4.0, 5.0, 12.0, 10.0, 12.0, 0.0, 17.0, 4.0, 27.0, 23.0, 72.0, 51.0, 74.0, 104.0, 99.0, 169.0, 231.0, 287.0, 442.0, 566.0, 831.0, 1383.0, 2670.0, 4820.0, 10877.0, 33635.0, 5832726.0, 351219.0, 29581.0, 10219.0, 4439.0, 2397.0, 1510.0, 822.0, 545.0, 450.0, 296.0, 202.0, 124.0, 66.0, 76.0, 76.0, 65.0, 41.0, 33.0, 39.0, 14.0, 11.0, 18.0, 9.0, 1.0, 5.0, 7.0, 5.0, 4.0, 9.0, 2.0, 0.0, 3.0], "bins": [-441.75, -427.921875, -414.09375, -400.265625, -386.4375, -372.609375, -358.78125, -344.953125, -331.125, -317.296875, -303.46875, -289.640625, -275.8125, -261.984375, -248.15625, -234.328125, -220.5, -206.671875, -192.84375, -179.015625, -165.1875, -151.359375, -137.53125, -123.703125, -109.875, -96.046875, -82.21875, -68.390625, -54.5625, -40.734375, -26.90625, -13.078125, 0.75, 14.578125, 28.40625, 42.234375, 56.0625, 69.890625, 83.71875, 97.546875, 111.375, 125.203125, 139.03125, 152.859375, 166.6875, 180.515625, 194.34375, 208.171875, 222.0, 235.828125, 249.65625, 263.484375, 277.3125, 291.140625, 304.96875, 318.796875, 332.625, 346.453125, 360.28125, 374.109375, 387.9375, 401.765625, 415.59375, 429.421875, 443.25]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 13.0, 13.0, 14.0, 16.0, 14.0, 23.0, 26.0, 41.0, 43.0, 86.0, 112.0, 822.0, 350.0, 110.0, 72.0, 47.0, 36.0, 28.0, 16.0, 11.0, 19.0, 14.0, 15.0, 10.0, 11.0, 4.0, 5.0, 10.0, 1.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-171.0, -165.6171875, -160.234375, -154.8515625, -149.46875, -144.0859375, -138.703125, -133.3203125, -127.9375, -122.5546875, -117.171875, -111.7890625, -106.40625, -101.0234375, -95.640625, -90.2578125, -84.875, -79.4921875, -74.109375, -68.7265625, -63.34375, -57.9609375, -52.578125, -47.1953125, -41.8125, -36.4296875, -31.046875, -25.6640625, -20.28125, -14.8984375, -9.515625, -4.1328125, 1.25, 6.6328125, 12.015625, 17.3984375, 22.78125, 28.1640625, 33.546875, 38.9296875, 44.3125, 49.6953125, 55.078125, 60.4609375, 65.84375, 71.2265625, 76.609375, 81.9921875, 87.375, 92.7578125, 98.140625, 103.5234375, 108.90625, 114.2890625, 119.671875, 125.0546875, 130.4375, 135.8203125, 141.203125, 146.5859375, 151.96875, 157.3515625, 162.734375, 168.1171875, 173.5]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 11.0, 9.0, 21.0, 40.0, 806.0, 46.0, 21.0, 14.0, 13.0, 9.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-514.5552368164062, -479.2791748046875, -444.0031433105469, -408.7270812988281, -373.4510498046875, -338.17498779296875, -302.89892578125, -267.62286376953125, -232.34683227539062, -197.07078552246094, -161.79473876953125, -126.5186767578125, -91.24263000488281, -55.966583251953125, -20.690521240234375, 14.585525512695312, 49.861572265625, 85.13761901855469, 120.4136734008789, 155.68972778320312, 190.9657745361328, 226.2418212890625, 261.51788330078125, 296.7939453125, 332.0699768066406, 367.3460388183594, 402.6220703125, 437.89813232421875, 473.1741943359375, 508.4502258300781, 543.726318359375, 579.0023193359375, 614.2783203125, 649.5543823242188, 684.8304443359375, 720.1064453125, 755.3825073242188, 790.6585693359375, 825.9346313476562, 861.210693359375, 896.4866943359375, 931.7627563476562, 967.038818359375, 1002.3148193359375, 1037.5909423828125, 1072.866943359375, 1108.14306640625, 1143.4190673828125, 1178.695068359375, 1213.9710693359375, 1249.2471923828125, 1284.523193359375, 1319.79931640625, 1355.0753173828125, 1390.351318359375, 1425.62744140625, 1460.903564453125, 1496.1795654296875, 1531.4556884765625, 1566.731689453125, 1602.0078125, 1637.2838134765625, 1672.559814453125, 1707.8359375, 1743.1119384765625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 6.0, 0.0, 6.0, 6.0, 14.0, 13.0, 21.0, 17.0, 81.0, 703.0, 40.0, 20.0, 19.0, 14.0, 10.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-686.4974365234375, -655.87890625, -625.2603149414062, -594.6417846679688, -564.023193359375, -533.4046630859375, -502.7861022949219, -472.16754150390625, -441.54901123046875, -410.9304504394531, -380.3118896484375, -349.693359375, -319.0747985839844, -288.45623779296875, -257.8376770019531, -227.21913146972656, -196.60055541992188, -165.98199462890625, -135.3634490966797, -104.74488830566406, -74.12633514404297, -43.507781982421875, -12.88922119140625, 17.729324340820312, 48.34788513183594, 78.96643829345703, 109.58499145507812, 140.20355224609375, 170.82211303710938, 201.44065856933594, 232.05921936035156, 262.6777648925781, 293.29632568359375, 323.9148864746094, 354.533447265625, 385.1519775390625, 415.7705383300781, 446.38909912109375, 477.0076599121094, 507.626220703125, 538.2447509765625, 568.86328125, 599.4818725585938, 630.1004028320312, 660.718994140625, 691.3375244140625, 721.9560546875, 752.5746459960938, 783.1932373046875, 813.811767578125, 844.4303588867188, 875.0488891601562, 905.66748046875, 936.2860107421875, 966.904541015625, 997.5231323242188, 1028.1416015625, 1058.7601318359375, 1089.378662109375, 1119.997314453125, 1150.6158447265625, 1181.234375, 1211.8529052734375, 1242.471435546875, 1273.090087890625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 3.0, 10.0, 15.0, 14.0, 24.0, 29.0, 38.0, 56.0, 66.0, 103.0, 126.0, 155.0, 238.0, 275.0, 401.0, 576.0, 900.0, 1757.0, 4010.0, 12523.0, 75798.0, 3800508.0, 257240.0, 23997.0, 7923.0, 3443.0, 1674.0, 898.0, 482.0, 302.0, 180.0, 146.0, 79.0, 64.0, 59.0, 38.0, 26.0, 26.0, 15.0, 18.0, 13.0, 6.0, 10.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.90625, -9.5836181640625, -9.260986328125, -8.9383544921875, -8.61572265625, -8.2930908203125, -7.970458984375, -7.6478271484375, -7.3251953125, -7.0025634765625, -6.679931640625, -6.3572998046875, -6.03466796875, -5.7120361328125, -5.389404296875, -5.0667724609375, -4.744140625, -4.4215087890625, -4.098876953125, -3.7762451171875, -3.45361328125, -3.1309814453125, -2.808349609375, -2.4857177734375, -2.1630859375, -1.8404541015625, -1.517822265625, -1.1951904296875, -0.87255859375, -0.5499267578125, -0.227294921875, 0.0953369140625, 0.41796875, 0.7406005859375, 1.063232421875, 1.3858642578125, 1.70849609375, 2.0311279296875, 2.353759765625, 2.6763916015625, 2.9990234375, 3.3216552734375, 3.644287109375, 3.9669189453125, 4.28955078125, 4.6121826171875, 4.934814453125, 5.2574462890625, 5.580078125, 5.9027099609375, 6.225341796875, 6.5479736328125, 6.87060546875, 7.1932373046875, 7.515869140625, 7.8385009765625, 8.1611328125, 8.4837646484375, 8.806396484375, 9.1290283203125, 9.45166015625, 9.7742919921875, 10.096923828125, 10.4195556640625, 10.7421875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 6.0, 10.0, 23.0, 65.0, 207.0, 315.0, 235.0, 84.0, 18.0, 9.0, 4.0, 7.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84033203125, -0.81195068359375, -0.7835693359375, -0.75518798828125, -0.726806640625, -0.69842529296875, -0.6700439453125, -0.64166259765625, -0.61328125, -0.58489990234375, -0.5565185546875, -0.52813720703125, -0.499755859375, -0.47137451171875, -0.4429931640625, -0.41461181640625, -0.38623046875, -0.35784912109375, -0.3294677734375, -0.30108642578125, -0.272705078125, -0.24432373046875, -0.2159423828125, -0.18756103515625, -0.1591796875, -0.13079833984375, -0.1024169921875, -0.07403564453125, -0.045654296875, -0.01727294921875, 0.0111083984375, 0.03948974609375, 0.06787109375, 0.09625244140625, 0.1246337890625, 0.15301513671875, 0.181396484375, 0.20977783203125, 0.2381591796875, 0.26654052734375, 0.294921875, 0.32330322265625, 0.3516845703125, 0.38006591796875, 0.408447265625, 0.43682861328125, 0.4652099609375, 0.49359130859375, 0.52197265625, 0.55035400390625, 0.5787353515625, 0.60711669921875, 0.635498046875, 0.66387939453125, 0.6922607421875, 0.72064208984375, 0.7490234375, 0.77740478515625, 0.8057861328125, 0.83416748046875, 0.862548828125, 0.89093017578125, 0.9193115234375, 0.94769287109375, 0.97607421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 5.0, 4.0, 5.0, 4.0, 17.0, 19.0, 35.0, 46.0, 66.0, 102.0, 185.0, 304.0, 716.0, 1827.0, 6537.0, 42582.0, 2728166.0, 1374640.0, 31599.0, 4807.0, 1331.0, 506.0, 262.0, 157.0, 87.0, 77.0, 55.0, 39.0, 23.0, 22.0, 17.0, 11.0, 6.0, 5.0, 4.0, 10.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.453125, -9.0892333984375, -8.725341796875, -8.3614501953125, -7.99755859375, -7.6336669921875, -7.269775390625, -6.9058837890625, -6.5419921875, -6.1781005859375, -5.814208984375, -5.4503173828125, -5.08642578125, -4.7225341796875, -4.358642578125, -3.9947509765625, -3.630859375, -3.2669677734375, -2.903076171875, -2.5391845703125, -2.17529296875, -1.8114013671875, -1.447509765625, -1.0836181640625, -0.7197265625, -0.3558349609375, 0.008056640625, 0.3719482421875, 0.73583984375, 1.0997314453125, 1.463623046875, 1.8275146484375, 2.19140625, 2.5552978515625, 2.919189453125, 3.2830810546875, 3.64697265625, 4.0108642578125, 4.374755859375, 4.7386474609375, 5.1025390625, 5.4664306640625, 5.830322265625, 6.1942138671875, 6.55810546875, 6.9219970703125, 7.285888671875, 7.6497802734375, 8.013671875, 8.3775634765625, 8.741455078125, 9.1053466796875, 9.46923828125, 9.8331298828125, 10.197021484375, 10.5609130859375, 10.9248046875, 11.2886962890625, 11.652587890625, 12.0164794921875, 12.38037109375, 12.7442626953125, 13.108154296875, 13.4720458984375, 13.8359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 5.0, 11.0, 11.0, 21.0, 16.0, 21.0, 28.0, 42.0, 46.0, 58.0, 68.0, 81.0, 98.0, 116.0, 159.0, 191.0, 234.0, 393.0, 1053.0, 488.0, 291.0, 190.0, 131.0, 88.0, 60.0, 39.0, 31.0, 20.0, 27.0, 13.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5654296875, -1.528564453125, -1.49169921875, -1.454833984375, -1.41796875, -1.381103515625, -1.34423828125, -1.307373046875, -1.2705078125, -1.233642578125, -1.19677734375, -1.159912109375, -1.123046875, -1.086181640625, -1.04931640625, -1.012451171875, -0.9755859375, -0.938720703125, -0.90185546875, -0.864990234375, -0.828125, -0.791259765625, -0.75439453125, -0.717529296875, -0.6806640625, -0.643798828125, -0.60693359375, -0.570068359375, -0.533203125, -0.496337890625, -0.45947265625, -0.422607421875, -0.3857421875, -0.348876953125, -0.31201171875, -0.275146484375, -0.23828125, -0.201416015625, -0.16455078125, -0.127685546875, -0.0908203125, -0.053955078125, -0.01708984375, 0.019775390625, 0.056640625, 0.093505859375, 0.13037109375, 0.167236328125, 0.2041015625, 0.240966796875, 0.27783203125, 0.314697265625, 0.3515625, 0.388427734375, 0.42529296875, 0.462158203125, 0.4990234375, 0.535888671875, 0.57275390625, 0.609619140625, 0.646484375, 0.683349609375, 0.72021484375, 0.757080078125, 0.7939453125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 9.0, 5.0, 16.0, 38.0, 108.0, 415.0, 396.0, 20.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.39115142822266, -105.54414367675781, -102.6971435546875, -99.85014343261719, -97.00313568115234, -94.1561279296875, -91.30912780761719, -88.46212768554688, -85.61511993408203, -82.76811218261719, -79.92111206054688, -77.07411193847656, -74.22710418701172, -71.38009643554688, -68.53309631347656, -65.68609619140625, -62.839088439941406, -59.99208450317383, -57.14508056640625, -54.29807662963867, -51.451072692871094, -48.604068756103516, -45.75706481933594, -42.91006088256836, -40.06305694580078, -37.2160530090332, -34.369049072265625, -31.522045135498047, -28.67504119873047, -25.82803726196289, -22.981033325195312, -20.134029388427734, -17.287017822265625, -14.440013885498047, -11.593009948730469, -8.74600601196289, -5.8990020751953125, -3.0519981384277344, -0.20499420166015625, 2.642009735107422, 5.489013671875, 8.336017608642578, 11.183021545410156, 14.030025482177734, 16.877029418945312, 19.72403335571289, 22.57103729248047, 25.418041229248047, 28.265045166015625, 31.112049102783203, 33.95905303955078, 36.80605697631836, 39.65306091308594, 42.500064849853516, 45.347068786621094, 48.19407272338867, 51.04107666015625, 53.88808059692383, 56.735084533691406, 59.582088470458984, 62.42909240722656, 65.27609252929688, 68.12310028076172, 70.97010803222656, 73.81710815429688]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 11.0, 16.0, 11.0, 25.0, 21.0, 29.0, 42.0, 60.0, 56.0, 86.0, 87.0, 78.0, 81.0, 67.0, 69.0, 63.0, 46.0, 40.0, 31.0, 24.0, 22.0, 13.0, 6.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.537656784057617, -20.90022850036621, -20.262800216674805, -19.6253719329834, -18.987943649291992, -18.350515365600586, -17.71308708190918, -17.075660705566406, -16.438232421875, -15.800804138183594, -15.163375854492188, -14.525947570800781, -13.888519287109375, -13.251091003417969, -12.613663673400879, -11.976235389709473, -11.33880615234375, -10.701377868652344, -10.063949584960938, -9.426521301269531, -8.789093017578125, -8.151664733886719, -7.514237403869629, -6.876809120178223, -6.239380836486816, -5.60195255279541, -4.964524269104004, -4.327096462249756, -3.6896681785583496, -3.0522398948669434, -2.414811849594116, -1.777383804321289, -1.1399555206298828, -0.5025273561477661, 0.13490080833435059, 0.7723289728164673, 1.409757137298584, 2.0471854209899902, 2.6846134662628174, 3.3220415115356445, 3.959469795227051, 4.596898078918457, 5.234326362609863, 5.871754169464111, 6.509182453155518, 7.146610736846924, 7.784038543701172, 8.421466827392578, 9.058895111083984, 9.69632339477539, 10.333751678466797, 10.971179962158203, 11.60860824584961, 12.246036529541016, 12.883463859558105, 13.520892143249512, 14.158320426940918, 14.795748710632324, 15.43317699432373, 16.07060432434082, 16.708032608032227, 17.345460891723633, 17.98288917541504, 18.620317459106445, 19.25774574279785]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 1.0, 5.0, 6.0, 14.0, 13.0, 16.0, 16.0, 25.0, 39.0, 56.0, 77.0, 95.0, 143.0, 199.0, 321.0, 421.0, 681.0, 1135.0, 1989.0, 4096.0, 10933.0, 50954.0, 731118.0, 207730.0, 24333.0, 6898.0, 3009.0, 1533.0, 919.0, 549.0, 353.0, 260.0, 156.0, 133.0, 83.0, 56.0, 58.0, 38.0, 23.0, 22.0, 10.0, 18.0, 7.0, 8.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.21875, -5.04925537109375, -4.8797607421875, -4.71026611328125, -4.540771484375, -4.37127685546875, -4.2017822265625, -4.03228759765625, -3.86279296875, -3.69329833984375, -3.5238037109375, -3.35430908203125, -3.184814453125, -3.01531982421875, -2.8458251953125, -2.67633056640625, -2.5068359375, -2.33734130859375, -2.1678466796875, -1.99835205078125, -1.828857421875, -1.65936279296875, -1.4898681640625, -1.32037353515625, -1.15087890625, -0.98138427734375, -0.8118896484375, -0.64239501953125, -0.472900390625, -0.30340576171875, -0.1339111328125, 0.03558349609375, 0.205078125, 0.37457275390625, 0.5440673828125, 0.71356201171875, 0.883056640625, 1.05255126953125, 1.2220458984375, 1.39154052734375, 1.56103515625, 1.73052978515625, 1.9000244140625, 2.06951904296875, 2.239013671875, 2.40850830078125, 2.5780029296875, 2.74749755859375, 2.9169921875, 3.08648681640625, 3.2559814453125, 3.42547607421875, 3.594970703125, 3.76446533203125, 3.9339599609375, 4.10345458984375, 4.27294921875, 4.44244384765625, 4.6119384765625, 4.78143310546875, 4.950927734375, 5.12042236328125, 5.2899169921875, 5.45941162109375, 5.62890625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 7.0, 6.0, 8.0, 17.0, 25.0, 48.0, 85.0, 183.0, 202.0, 166.0, 114.0, 59.0, 31.0, 17.0, 12.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88671875, -0.8637466430664062, -0.8407745361328125, -0.8178024291992188, -0.794830322265625, -0.7718582153320312, -0.7488861083984375, -0.7259140014648438, -0.70294189453125, -0.6799697875976562, -0.6569976806640625, -0.6340255737304688, -0.611053466796875, -0.5880813598632812, -0.5651092529296875, -0.5421371459960938, -0.5191650390625, -0.49619293212890625, -0.4732208251953125, -0.45024871826171875, -0.427276611328125, -0.40430450439453125, -0.3813323974609375, -0.35836029052734375, -0.33538818359375, -0.31241607666015625, -0.2894439697265625, -0.26647186279296875, -0.243499755859375, -0.22052764892578125, -0.1975555419921875, -0.17458343505859375, -0.151611328125, -0.12863922119140625, -0.1056671142578125, -0.08269500732421875, -0.059722900390625, -0.03675079345703125, -0.0137786865234375, 0.00919342041015625, 0.03216552734375, 0.05513763427734375, 0.0781097412109375, 0.10108184814453125, 0.124053955078125, 0.14702606201171875, 0.1699981689453125, 0.19297027587890625, 0.2159423828125, 0.23891448974609375, 0.2618865966796875, 0.28485870361328125, 0.307830810546875, 0.33080291748046875, 0.3537750244140625, 0.37674713134765625, 0.39971923828125, 0.42269134521484375, 0.4456634521484375, 0.46863555908203125, 0.491607666015625, 0.5145797729492188, 0.5375518798828125, 0.5605239868164062, 0.58349609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 8.0, 14.0, 24.0, 27.0, 40.0, 87.0, 134.0, 240.0, 416.0, 904.0, 1740.0, 4821.0, 16949.0, 95991.0, 768425.0, 128282.0, 20750.0, 5559.0, 2061.0, 957.0, 470.0, 270.0, 144.0, 66.0, 38.0, 30.0, 23.0, 18.0, 14.0, 11.0, 7.0, 2.0, 8.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9296875, -8.68548583984375, -8.4412841796875, -8.19708251953125, -7.952880859375, -7.70867919921875, -7.4644775390625, -7.22027587890625, -6.97607421875, -6.73187255859375, -6.4876708984375, -6.24346923828125, -5.999267578125, -5.75506591796875, -5.5108642578125, -5.26666259765625, -5.0224609375, -4.77825927734375, -4.5340576171875, -4.28985595703125, -4.045654296875, -3.80145263671875, -3.5572509765625, -3.31304931640625, -3.06884765625, -2.82464599609375, -2.5804443359375, -2.33624267578125, -2.092041015625, -1.84783935546875, -1.6036376953125, -1.35943603515625, -1.115234375, -0.87103271484375, -0.6268310546875, -0.38262939453125, -0.138427734375, 0.10577392578125, 0.3499755859375, 0.59417724609375, 0.83837890625, 1.08258056640625, 1.3267822265625, 1.57098388671875, 1.815185546875, 2.05938720703125, 2.3035888671875, 2.54779052734375, 2.7919921875, 3.03619384765625, 3.2803955078125, 3.52459716796875, 3.768798828125, 4.01300048828125, 4.2572021484375, 4.50140380859375, 4.74560546875, 4.98980712890625, 5.2340087890625, 5.47821044921875, 5.722412109375, 5.96661376953125, 6.2108154296875, 6.45501708984375, 6.69921875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 4.0, 4.0, 13.0, 14.0, 11.0, 12.0, 12.0, 23.0, 27.0, 16.0, 25.0, 40.0, 36.0, 41.0, 34.0, 40.0, 51.0, 45.0, 42.0, 48.0, 50.0, 40.0, 39.0, 50.0, 39.0, 48.0, 35.0, 24.0, 22.0, 15.0, 18.0, 16.0, 14.0, 12.0, 5.0, 8.0, 3.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.283203125, -2.201019287109375, -2.11883544921875, -2.036651611328125, -1.9544677734375, -1.872283935546875, -1.79010009765625, -1.707916259765625, -1.625732421875, -1.543548583984375, -1.46136474609375, -1.379180908203125, -1.2969970703125, -1.214813232421875, -1.13262939453125, -1.050445556640625, -0.96826171875, -0.886077880859375, -0.80389404296875, -0.721710205078125, -0.6395263671875, -0.557342529296875, -0.47515869140625, -0.392974853515625, -0.310791015625, -0.228607177734375, -0.14642333984375, -0.064239501953125, 0.0179443359375, 0.100128173828125, 0.18231201171875, 0.264495849609375, 0.3466796875, 0.428863525390625, 0.51104736328125, 0.593231201171875, 0.6754150390625, 0.757598876953125, 0.83978271484375, 0.921966552734375, 1.004150390625, 1.086334228515625, 1.16851806640625, 1.250701904296875, 1.3328857421875, 1.415069580078125, 1.49725341796875, 1.579437255859375, 1.66162109375, 1.743804931640625, 1.82598876953125, 1.908172607421875, 1.9903564453125, 2.072540283203125, 2.15472412109375, 2.236907958984375, 2.319091796875, 2.401275634765625, 2.48345947265625, 2.565643310546875, 2.6478271484375, 2.730010986328125, 2.81219482421875, 2.894378662109375, 2.9765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 5.0, 6.0, 10.0, 20.0, 24.0, 39.0, 84.0, 156.0, 353.0, 1221.0, 12532.0, 1026197.0, 6375.0, 876.0, 315.0, 162.0, 63.0, 45.0, 21.0, 18.0, 7.0, 2.0, 7.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.9375, -42.6962890625, -41.455078125, -40.2138671875, -38.97265625, -37.7314453125, -36.490234375, -35.2490234375, -34.0078125, -32.7666015625, -31.525390625, -30.2841796875, -29.04296875, -27.8017578125, -26.560546875, -25.3193359375, -24.078125, -22.8369140625, -21.595703125, -20.3544921875, -19.11328125, -17.8720703125, -16.630859375, -15.3896484375, -14.1484375, -12.9072265625, -11.666015625, -10.4248046875, -9.18359375, -7.9423828125, -6.701171875, -5.4599609375, -4.21875, -2.9775390625, -1.736328125, -0.4951171875, 0.74609375, 1.9873046875, 3.228515625, 4.4697265625, 5.7109375, 6.9521484375, 8.193359375, 9.4345703125, 10.67578125, 11.9169921875, 13.158203125, 14.3994140625, 15.640625, 16.8818359375, 18.123046875, 19.3642578125, 20.60546875, 21.8466796875, 23.087890625, 24.3291015625, 25.5703125, 26.8115234375, 28.052734375, 29.2939453125, 30.53515625, 31.7763671875, 33.017578125, 34.2587890625, 35.5]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 12.0, 20.0, 45.0, 125.0, 281.0, 296.0, 104.0, 54.0, 23.0, 13.0, 8.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003864765167236328, -0.00036073848605155945, -0.0003350004553794861, -0.0003092624247074127, -0.00028352439403533936, -0.000257786363363266, -0.00023204833269119263, -0.00020631030201911926, -0.0001805722713470459, -0.00015483424067497253, -0.00012909621000289917, -0.0001033581793308258, -7.762014865875244e-05, -5.188211798667908e-05, -2.6144087314605713e-05, -4.0605664253234863e-07, 2.5331974029541016e-05, 5.107000470161438e-05, 7.680803537368774e-05, 0.00010254606604576111, 0.00012828409671783447, 0.00015402212738990784, 0.0001797601580619812, 0.00020549818873405457, 0.00023123621940612793, 0.0002569742500782013, 0.00028271228075027466, 0.000308450311422348, 0.0003341883420944214, 0.00035992637276649475, 0.0003856644034385681, 0.0004114024341106415, 0.00043714046478271484, 0.0004628784954547882, 0.0004886165261268616, 0.0005143545567989349, 0.0005400925874710083, 0.0005658306181430817, 0.000591568648815155, 0.0006173066794872284, 0.0006430447101593018, 0.0006687827408313751, 0.0006945207715034485, 0.0007202588021755219, 0.0007459968328475952, 0.0007717348635196686, 0.0007974728941917419, 0.0008232109248638153, 0.0008489489555358887, 0.000874686986207962, 0.0009004250168800354, 0.0009261630475521088, 0.0009519010782241821, 0.0009776391088962555, 0.0010033771395683289, 0.0010291151702404022, 0.0010548532009124756, 0.001080591231584549, 0.0011063292622566223, 0.0011320672929286957, 0.001157805323600769, 0.0011835433542728424, 0.0012092813849449158, 0.0012350194156169891, 0.0012607574462890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 8.0, 6.0, 11.0, 24.0, 31.0, 50.0, 81.0, 125.0, 267.0, 580.0, 1614.0, 5305.0, 50522.0, 960765.0, 23093.0, 3897.0, 1153.0, 474.0, 210.0, 129.0, 90.0, 49.0, 22.0, 11.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-17.5, -17.0665283203125, -16.633056640625, -16.1995849609375, -15.76611328125, -15.3326416015625, -14.899169921875, -14.4656982421875, -14.0322265625, -13.5987548828125, -13.165283203125, -12.7318115234375, -12.29833984375, -11.8648681640625, -11.431396484375, -10.9979248046875, -10.564453125, -10.1309814453125, -9.697509765625, -9.2640380859375, -8.83056640625, -8.3970947265625, -7.963623046875, -7.5301513671875, -7.0966796875, -6.6632080078125, -6.229736328125, -5.7962646484375, -5.36279296875, -4.9293212890625, -4.495849609375, -4.0623779296875, -3.62890625, -3.1954345703125, -2.761962890625, -2.3284912109375, -1.89501953125, -1.4615478515625, -1.028076171875, -0.5946044921875, -0.1611328125, 0.2723388671875, 0.705810546875, 1.1392822265625, 1.57275390625, 2.0062255859375, 2.439697265625, 2.8731689453125, 3.306640625, 3.7401123046875, 4.173583984375, 4.6070556640625, 5.04052734375, 5.4739990234375, 5.907470703125, 6.3409423828125, 6.7744140625, 7.2078857421875, 7.641357421875, 8.0748291015625, 8.50830078125, 8.9417724609375, 9.375244140625, 9.8087158203125, 10.2421875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 7.0, 15.0, 26.0, 31.0, 53.0, 121.0, 240.0, 212.0, 126.0, 78.0, 40.0, 17.0, 10.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.4324951171875, -4.232177734375, -4.0318603515625, -3.83154296875, -3.6312255859375, -3.430908203125, -3.2305908203125, -3.0302734375, -2.8299560546875, -2.629638671875, -2.4293212890625, -2.22900390625, -2.0286865234375, -1.828369140625, -1.6280517578125, -1.427734375, -1.2274169921875, -1.027099609375, -0.8267822265625, -0.62646484375, -0.4261474609375, -0.225830078125, -0.0255126953125, 0.1748046875, 0.3751220703125, 0.575439453125, 0.7757568359375, 0.97607421875, 1.1763916015625, 1.376708984375, 1.5770263671875, 1.77734375, 1.9776611328125, 2.177978515625, 2.3782958984375, 2.57861328125, 2.7789306640625, 2.979248046875, 3.1795654296875, 3.3798828125, 3.5802001953125, 3.780517578125, 3.9808349609375, 4.18115234375, 4.3814697265625, 4.581787109375, 4.7821044921875, 4.982421875, 5.1827392578125, 5.383056640625, 5.5833740234375, 5.78369140625, 5.9840087890625, 6.184326171875, 6.3846435546875, 6.5849609375, 6.7852783203125, 6.985595703125, 7.1859130859375, 7.38623046875, 7.5865478515625, 7.786865234375, 7.9871826171875, 8.1875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 7.0, 14.0, 19.0, 24.0, 55.0, 112.0, 232.0, 329.0, 126.0, 38.0, 14.0, 7.0, 7.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.98529052734375, -71.69825744628906, -69.4112319946289, -67.12419891357422, -64.83717346191406, -62.550140380859375, -60.26310729980469, -57.976078033447266, -55.689048767089844, -53.40201950073242, -51.114990234375, -48.82795715332031, -46.54092788696289, -44.25389862060547, -41.96686553955078, -39.67983627319336, -37.39280700683594, -35.105777740478516, -32.818748474121094, -30.531715393066406, -28.244686126708984, -25.957656860351562, -23.670625686645508, -21.383594512939453, -19.09656524658203, -16.80953598022461, -14.522504806518555, -12.235474586486816, -9.948444366455078, -7.66141414642334, -5.374383926391602, -3.087352752685547, -0.8003311157226562, 1.486699104309082, 3.7737293243408203, 6.060759544372559, 8.347789764404297, 10.634819984436035, 12.921850204467773, 15.208881378173828, 17.49591064453125, 19.782939910888672, 22.069971084594727, 24.35700225830078, 26.644031524658203, 28.931060791015625, 31.21809196472168, 33.505123138427734, 35.792152404785156, 38.07918167114258, 40.3662109375, 42.65324401855469, 44.94027328491211, 47.22730255126953, 49.51433563232422, 51.80136489868164, 54.08839416503906, 56.375423431396484, 58.662452697753906, 60.949485778808594, 63.236515045166016, 65.52354431152344, 67.81057739257812, 70.09761047363281, 72.38463592529297]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 8.0, 4.0, 10.0, 4.0, 14.0, 32.0, 41.0, 57.0, 86.0, 123.0, 115.0, 131.0, 108.0, 90.0, 54.0, 42.0, 31.0, 16.0, 9.0, 10.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.24704360961914, -45.559181213378906, -43.871315002441406, -42.18345260620117, -40.49559020996094, -38.80772399902344, -37.1198616027832, -35.43199920654297, -33.744136810302734, -32.0562744140625, -30.368410110473633, -28.680545806884766, -26.99268341064453, -25.304819107055664, -23.616954803466797, -21.929092407226562, -20.241228103637695, -18.553363800048828, -16.865501403808594, -15.177637100219727, -13.489774703979492, -11.801910400390625, -10.114047050476074, -8.426183700561523, -6.738320350646973, -5.050457000732422, -3.362593412399292, -1.674729824066162, 0.013133525848388672, 1.7009973526000977, 3.3888607025146484, 5.076724052429199, 6.76458740234375, 8.4524507522583, 10.140314102172852, 11.828178405761719, 13.516040802001953, 15.20390510559082, 16.891769409179688, 18.579631805419922, 20.267494201660156, 21.955358505249023, 23.643220901489258, 25.331085205078125, 27.01894760131836, 28.706811904907227, 30.394676208496094, 32.08253860473633, 33.77040100097656, 35.4582633972168, 37.1461296081543, 38.83399200439453, 40.521854400634766, 42.209716796875, 43.8975830078125, 45.585445404052734, 47.273311614990234, 48.96117401123047, 50.64904022216797, 52.3369026184082, 54.02476501464844, 55.71263122558594, 57.40049362182617, 59.088356018066406, 60.77621841430664]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 9.0, 19.0, 42.0, 158.0, 9873.0, 4183072.0, 853.0, 150.0, 36.0, 24.0, 12.0, 13.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-224.875, -215.595703125, -206.31640625, -197.037109375, -187.7578125, -178.478515625, -169.19921875, -159.919921875, -150.640625, -141.361328125, -132.08203125, -122.802734375, -113.5234375, -104.244140625, -94.96484375, -85.685546875, -76.40625, -67.126953125, -57.84765625, -48.568359375, -39.2890625, -30.009765625, -20.73046875, -11.451171875, -2.171875, 7.107421875, 16.38671875, 25.666015625, 34.9453125, 44.224609375, 53.50390625, 62.783203125, 72.0625, 81.341796875, 90.62109375, 99.900390625, 109.1796875, 118.458984375, 127.73828125, 137.017578125, 146.296875, 155.576171875, 164.85546875, 174.134765625, 183.4140625, 192.693359375, 201.97265625, 211.251953125, 220.53125, 229.810546875, 239.08984375, 248.369140625, 257.6484375, 266.927734375, 276.20703125, 285.486328125, 294.765625, 304.044921875, 313.32421875, 322.603515625, 331.8828125, 341.162109375, 350.44140625, 359.720703125, 369.0]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 3.0, 5.0, 4.0, 13.0, 7.0, 32.0, 36.0, 38.0, 49.0, 74.0, 71.0, 89.0, 114.0, 82.0, 77.0, 65.0, 60.0, 38.0, 37.0, 25.0, 19.0, 12.0, 8.0, 14.0, 4.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5302734375, -0.5158271789550781, -0.5013809204101562, -0.4869346618652344, -0.4724884033203125, -0.4580421447753906, -0.44359588623046875, -0.4291496276855469, -0.414703369140625, -0.4002571105957031, -0.38581085205078125, -0.3713645935058594, -0.3569183349609375, -0.3424720764160156, -0.32802581787109375, -0.3135795593261719, -0.29913330078125, -0.2846870422363281, -0.27024078369140625, -0.2557945251464844, -0.2413482666015625, -0.22690200805664062, -0.21245574951171875, -0.19800949096679688, -0.183563232421875, -0.16911697387695312, -0.15467071533203125, -0.14022445678710938, -0.1257781982421875, -0.11133193969726562, -0.09688568115234375, -0.08243942260742188, -0.0679931640625, -0.053546905517578125, -0.03910064697265625, -0.024654388427734375, -0.0102081298828125, 0.004238128662109375, 0.01868438720703125, 0.033130645751953125, 0.047576904296875, 0.062023162841796875, 0.07646942138671875, 0.09091567993164062, 0.1053619384765625, 0.11980819702148438, 0.13425445556640625, 0.14870071411132812, 0.16314697265625, 0.17759323120117188, 0.19203948974609375, 0.20648574829101562, 0.2209320068359375, 0.23537826538085938, 0.24982452392578125, 0.2642707824707031, 0.278717041015625, 0.2931632995605469, 0.30760955810546875, 0.3220558166503906, 0.3365020751953125, 0.3509483337402344, 0.36539459228515625, 0.3798408508300781, 0.394287109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 11.0, 8.0, 34.0, 41.0, 100.0, 172.0, 289.0, 554.0, 55501.0, 4136944.0, 506.0, 101.0, 21.0, 5.0, 2.0], "bins": [-192.5, -189.189453125, -185.87890625, -182.568359375, -179.2578125, -175.947265625, -172.63671875, -169.326171875, -166.015625, -162.705078125, -159.39453125, -156.083984375, -152.7734375, -149.462890625, -146.15234375, -142.841796875, -139.53125, -136.220703125, -132.91015625, -129.599609375, -126.2890625, -122.978515625, -119.66796875, -116.357421875, -113.046875, -109.736328125, -106.42578125, -103.115234375, -99.8046875, -96.494140625, -93.18359375, -89.873046875, -86.5625, -83.251953125, -79.94140625, -76.630859375, -73.3203125, -70.009765625, -66.69921875, -63.388671875, -60.078125, -56.767578125, -53.45703125, -50.146484375, -46.8359375, -43.525390625, -40.21484375, -36.904296875, -33.59375, -30.283203125, -26.97265625, -23.662109375, -20.3515625, -17.041015625, -13.73046875, -10.419921875, -7.109375, -3.798828125, -0.48828125, 2.822265625, 6.1328125, 9.443359375, 12.75390625, 16.064453125, 19.375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 9.0, 12.0, 20.0, 25.0, 45.0, 50.0, 69.0, 154.0, 261.0, 459.0, 1280.0, 1006.0, 310.0, 141.0, 68.0, 44.0, 39.0, 24.0, 21.0, 6.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.486328125, -1.4450225830078125, -1.403717041015625, -1.3624114990234375, -1.32110595703125, -1.2798004150390625, -1.238494873046875, -1.1971893310546875, -1.1558837890625, -1.1145782470703125, -1.073272705078125, -1.0319671630859375, -0.99066162109375, -0.9493560791015625, -0.908050537109375, -0.8667449951171875, -0.825439453125, -0.7841339111328125, -0.742828369140625, -0.7015228271484375, -0.66021728515625, -0.6189117431640625, -0.577606201171875, -0.5363006591796875, -0.4949951171875, -0.4536895751953125, -0.412384033203125, -0.3710784912109375, -0.32977294921875, -0.2884674072265625, -0.247161865234375, -0.2058563232421875, -0.16455078125, -0.1232452392578125, -0.081939697265625, -0.0406341552734375, 0.00067138671875, 0.0419769287109375, 0.083282470703125, 0.1245880126953125, 0.1658935546875, 0.2071990966796875, 0.248504638671875, 0.2898101806640625, 0.33111572265625, 0.3724212646484375, 0.413726806640625, 0.4550323486328125, 0.496337890625, 0.5376434326171875, 0.578948974609375, 0.6202545166015625, 0.66156005859375, 0.7028656005859375, 0.744171142578125, 0.7854766845703125, 0.8267822265625, 0.8680877685546875, 0.909393310546875, 0.9506988525390625, 0.99200439453125, 1.0333099365234375, 1.074615478515625, 1.1159210205078125, 1.1572265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 10.0, 131.0, 874.0, 6.0], "bins": [-796.6268920898438, -783.8317260742188, -771.0365600585938, -758.241455078125, -745.4462890625, -732.651123046875, -719.85595703125, -707.060791015625, -694.265625, -681.470458984375, -668.67529296875, -655.880126953125, -643.0850219726562, -630.2898559570312, -617.4946899414062, -604.6995239257812, -591.9044189453125, -579.1092529296875, -566.3140869140625, -553.5189208984375, -540.7238159179688, -527.9286499023438, -515.1334838867188, -502.33831787109375, -489.54315185546875, -476.74798583984375, -463.9528503417969, -451.1576843261719, -438.3625183105469, -425.5673828125, -412.772216796875, -399.97705078125, -387.18194580078125, -374.38677978515625, -361.5916442871094, -348.7964782714844, -336.0013122558594, -323.2061767578125, -310.4110107421875, -297.6158447265625, -284.8206787109375, -272.0255126953125, -259.2303771972656, -246.43521118164062, -233.6400604248047, -220.84490966796875, -208.04974365234375, -195.2545928955078, -182.45944213867188, -169.66429138183594, -156.86912536621094, -144.073974609375, -131.27882385253906, -118.4836654663086, -105.68850708007812, -92.89335632324219, -80.09820556640625, -67.30304718017578, -54.507896423339844, -41.712738037109375, -28.917583465576172, -16.12242889404297, -3.3272705078125, 9.467880249023438, 22.263042449951172]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 10.0, 11.0, 27.0, 37.0, 66.0, 139.0, 152.0, 180.0, 150.0, 104.0, 57.0, 37.0, 19.0, 11.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-49.45118713378906, -48.48410415649414, -47.51702117919922, -46.5499382019043, -45.582855224609375, -44.61577224731445, -43.64868927001953, -42.68160629272461, -41.71452331542969, -40.747440338134766, -39.780357360839844, -38.81327438354492, -37.84619140625, -36.87910842895508, -35.912025451660156, -34.944942474365234, -33.97785949707031, -33.01077651977539, -32.04369354248047, -31.076610565185547, -30.109527587890625, -29.142444610595703, -28.17536163330078, -27.20827865600586, -26.241199493408203, -25.27411651611328, -24.30703353881836, -23.339950561523438, -22.372867584228516, -21.405784606933594, -20.438701629638672, -19.47161865234375, -18.504535675048828, -17.537452697753906, -16.570369720458984, -15.603286743164062, -14.63620376586914, -13.669120788574219, -12.702038764953613, -11.734955787658691, -10.767871856689453, -9.800788879394531, -8.83370590209961, -7.866623401641846, -6.899540424346924, -5.932457447052002, -4.965374946594238, -3.9982919692993164, -3.0312089920043945, -2.0641260147094727, -1.0970432758331299, -0.1299605369567871, 0.8371224403381348, 1.8042054176330566, 2.7712879180908203, 3.738370895385742, 4.705453872680664, 5.672536849975586, 6.639619827270508, 7.6067023277282715, 8.573785781860352, 9.540868759155273, 10.507950782775879, 11.4750337600708, 12.442116737365723]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 13.0, 6.0, 12.0, 18.0, 43.0, 42.0, 67.0, 116.0, 168.0, 283.0, 435.0, 702.0, 1250.0, 2173.0, 4005.0, 7722.0, 16736.0, 37442.0, 98208.0, 387105.0, 336588.0, 89766.0, 34172.0, 15275.0, 7396.0, 3753.0, 2065.0, 1141.0, 674.0, 401.0, 260.0, 155.0, 134.0, 71.0, 53.0, 22.0, 27.0, 18.0, 11.0, 11.0, 3.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.365386962890625, -3.26007080078125, -3.154754638671875, -3.0494384765625, -2.944122314453125, -2.83880615234375, -2.733489990234375, -2.628173828125, -2.522857666015625, -2.41754150390625, -2.312225341796875, -2.2069091796875, -2.101593017578125, -1.99627685546875, -1.890960693359375, -1.78564453125, -1.680328369140625, -1.57501220703125, -1.469696044921875, -1.3643798828125, -1.259063720703125, -1.15374755859375, -1.048431396484375, -0.943115234375, -0.837799072265625, -0.73248291015625, -0.627166748046875, -0.5218505859375, -0.416534423828125, -0.31121826171875, -0.205902099609375, -0.1005859375, 0.004730224609375, 0.11004638671875, 0.215362548828125, 0.3206787109375, 0.425994873046875, 0.53131103515625, 0.636627197265625, 0.741943359375, 0.847259521484375, 0.95257568359375, 1.057891845703125, 1.1632080078125, 1.268524169921875, 1.37384033203125, 1.479156494140625, 1.58447265625, 1.689788818359375, 1.79510498046875, 1.900421142578125, 2.0057373046875, 2.111053466796875, 2.21636962890625, 2.321685791015625, 2.427001953125, 2.532318115234375, 2.63763427734375, 2.742950439453125, 2.8482666015625, 2.953582763671875, 3.05889892578125, 3.164215087890625, 3.26953125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 15.0, 17.0, 16.0, 28.0, 43.0, 40.0, 46.0, 55.0, 66.0, 78.0, 64.0, 74.0, 54.0, 62.0, 53.0, 51.0, 35.0, 37.0, 37.0, 23.0, 25.0, 18.0, 12.0, 9.0, 10.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3505859375, -0.3387260437011719, -0.32686614990234375, -0.3150062561035156, -0.3031463623046875, -0.2912864685058594, -0.27942657470703125, -0.2675666809082031, -0.255706787109375, -0.24384689331054688, -0.23198699951171875, -0.22012710571289062, -0.2082672119140625, -0.19640731811523438, -0.18454742431640625, -0.17268753051757812, -0.16082763671875, -0.14896774291992188, -0.13710784912109375, -0.12524795532226562, -0.1133880615234375, -0.10152816772460938, -0.08966827392578125, -0.07780838012695312, -0.065948486328125, -0.054088592529296875, -0.04222869873046875, -0.030368804931640625, -0.0185089111328125, -0.006649017333984375, 0.00521087646484375, 0.017070770263671875, 0.0289306640625, 0.040790557861328125, 0.05265045166015625, 0.06451034545898438, 0.0763702392578125, 0.08823013305664062, 0.10009002685546875, 0.11194992065429688, 0.123809814453125, 0.13566970825195312, 0.14752960205078125, 0.15938949584960938, 0.1712493896484375, 0.18310928344726562, 0.19496917724609375, 0.20682907104492188, 0.21868896484375, 0.23054885864257812, 0.24240875244140625, 0.2542686462402344, 0.2661285400390625, 0.2779884338378906, 0.28984832763671875, 0.3017082214355469, 0.313568115234375, 0.3254280090332031, 0.33728790283203125, 0.3491477966308594, 0.3610076904296875, 0.3728675842285156, 0.38472747802734375, 0.3965873718261719, 0.408447265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 11.0, 19.0, 52.0, 297.0, 4264.0, 1001660.0, 41384.0, 685.0, 109.0, 32.0, 6.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.460205078125, -22.67041015625, -21.880615234375, -21.0908203125, -20.301025390625, -19.51123046875, -18.721435546875, -17.931640625, -17.141845703125, -16.35205078125, -15.562255859375, -14.7724609375, -13.982666015625, -13.19287109375, -12.403076171875, -11.61328125, -10.823486328125, -10.03369140625, -9.243896484375, -8.4541015625, -7.664306640625, -6.87451171875, -6.084716796875, -5.294921875, -4.505126953125, -3.71533203125, -2.925537109375, -2.1357421875, -1.345947265625, -0.55615234375, 0.233642578125, 1.0234375, 1.813232421875, 2.60302734375, 3.392822265625, 4.1826171875, 4.972412109375, 5.76220703125, 6.552001953125, 7.341796875, 8.131591796875, 8.92138671875, 9.711181640625, 10.5009765625, 11.290771484375, 12.08056640625, 12.870361328125, 13.66015625, 14.449951171875, 15.23974609375, 16.029541015625, 16.8193359375, 17.609130859375, 18.39892578125, 19.188720703125, 19.978515625, 20.768310546875, 21.55810546875, 22.347900390625, 23.1376953125, 23.927490234375, 24.71728515625, 25.507080078125, 26.296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 3.0, 5.0, 9.0, 10.0, 22.0, 28.0, 18.0, 25.0, 20.0, 16.0, 26.0, 31.0, 35.0, 49.0, 49.0, 43.0, 46.0, 51.0, 61.0, 54.0, 52.0, 47.0, 45.0, 28.0, 37.0, 28.0, 21.0, 19.0, 17.0, 20.0, 12.0, 13.0, 8.0, 9.0, 6.0, 11.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5200347900390625, -1.467803955078125, -1.4155731201171875, -1.36334228515625, -1.3111114501953125, -1.258880615234375, -1.2066497802734375, -1.1544189453125, -1.1021881103515625, -1.049957275390625, -0.9977264404296875, -0.94549560546875, -0.8932647705078125, -0.841033935546875, -0.7888031005859375, -0.736572265625, -0.6843414306640625, -0.632110595703125, -0.5798797607421875, -0.52764892578125, -0.4754180908203125, -0.423187255859375, -0.3709564208984375, -0.3187255859375, -0.2664947509765625, -0.214263916015625, -0.1620330810546875, -0.10980224609375, -0.0575714111328125, -0.005340576171875, 0.0468902587890625, 0.09912109375, 0.1513519287109375, 0.203582763671875, 0.2558135986328125, 0.30804443359375, 0.3602752685546875, 0.412506103515625, 0.4647369384765625, 0.5169677734375, 0.5691986083984375, 0.621429443359375, 0.6736602783203125, 0.72589111328125, 0.7781219482421875, 0.830352783203125, 0.8825836181640625, 0.934814453125, 0.9870452880859375, 1.039276123046875, 1.0915069580078125, 1.14373779296875, 1.1959686279296875, 1.248199462890625, 1.3004302978515625, 1.3526611328125, 1.4048919677734375, 1.457122802734375, 1.5093536376953125, 1.56158447265625, 1.6138153076171875, 1.666046142578125, 1.7182769775390625, 1.7705078125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 7.0, 15.0, 31.0, 64.0, 276.0, 4472.0, 1041961.0, 1481.0, 168.0, 44.0, 12.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-92.9375, -90.841796875, -88.74609375, -86.650390625, -84.5546875, -82.458984375, -80.36328125, -78.267578125, -76.171875, -74.076171875, -71.98046875, -69.884765625, -67.7890625, -65.693359375, -63.59765625, -61.501953125, -59.40625, -57.310546875, -55.21484375, -53.119140625, -51.0234375, -48.927734375, -46.83203125, -44.736328125, -42.640625, -40.544921875, -38.44921875, -36.353515625, -34.2578125, -32.162109375, -30.06640625, -27.970703125, -25.875, -23.779296875, -21.68359375, -19.587890625, -17.4921875, -15.396484375, -13.30078125, -11.205078125, -9.109375, -7.013671875, -4.91796875, -2.822265625, -0.7265625, 1.369140625, 3.46484375, 5.560546875, 7.65625, 9.751953125, 11.84765625, 13.943359375, 16.0390625, 18.134765625, 20.23046875, 22.326171875, 24.421875, 26.517578125, 28.61328125, 30.708984375, 32.8046875, 34.900390625, 36.99609375, 39.091796875, 41.1875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 9.0, 9.0, 17.0, 16.0, 16.0, 38.0, 48.0, 102.0, 137.0, 175.0, 147.0, 109.0, 50.0, 42.0, 23.0, 12.0, 11.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003783702850341797, -0.00036741793155670166, -0.00035646557807922363, -0.0003455132246017456, -0.0003345608711242676, -0.00032360851764678955, -0.0003126561641693115, -0.0003017038106918335, -0.00029075145721435547, -0.00027979910373687744, -0.0002688467502593994, -0.0002578943967819214, -0.00024694204330444336, -0.00023598968982696533, -0.0002250373363494873, -0.00021408498287200928, -0.00020313262939453125, -0.00019218027591705322, -0.0001812279224395752, -0.00017027556896209717, -0.00015932321548461914, -0.0001483708620071411, -0.00013741850852966309, -0.00012646615505218506, -0.00011551380157470703, -0.000104561448097229, -9.360909461975098e-05, -8.265674114227295e-05, -7.170438766479492e-05, -6.0752034187316895e-05, -4.979968070983887e-05, -3.884732723236084e-05, -2.7894973754882812e-05, -1.6942620277404785e-05, -5.990266799926758e-06, 4.9620866775512695e-06, 1.5914440155029297e-05, 2.6866793632507324e-05, 3.781914710998535e-05, 4.877150058746338e-05, 5.9723854064941406e-05, 7.067620754241943e-05, 8.162856101989746e-05, 9.258091449737549e-05, 0.00010353326797485352, 0.00011448562145233154, 0.00012543797492980957, 0.0001363903284072876, 0.00014734268188476562, 0.00015829503536224365, 0.00016924738883972168, 0.0001801997423171997, 0.00019115209579467773, 0.00020210444927215576, 0.0002130568027496338, 0.00022400915622711182, 0.00023496150970458984, 0.00024591386318206787, 0.0002568662166595459, 0.0002678185701370239, 0.00027877092361450195, 0.00028972327709198, 0.000300675630569458, 0.00031162798404693604, 0.00032258033752441406]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 12.0, 8.0, 14.0, 16.0, 22.0, 41.0, 68.0, 125.0, 246.0, 363.0, 730.0, 1464.0, 3415.0, 10832.0, 80305.0, 860577.0, 73607.0, 10448.0, 3208.0, 1381.0, 681.0, 360.0, 242.0, 131.0, 88.0, 41.0, 41.0, 21.0, 8.0, 15.0, 15.0, 5.0, 3.0, 8.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.65283203125, -6.4345703125, -6.21630859375, -5.998046875, -5.77978515625, -5.5615234375, -5.34326171875, -5.125, -4.90673828125, -4.6884765625, -4.47021484375, -4.251953125, -4.03369140625, -3.8154296875, -3.59716796875, -3.37890625, -3.16064453125, -2.9423828125, -2.72412109375, -2.505859375, -2.28759765625, -2.0693359375, -1.85107421875, -1.6328125, -1.41455078125, -1.1962890625, -0.97802734375, -0.759765625, -0.54150390625, -0.3232421875, -0.10498046875, 0.11328125, 0.33154296875, 0.5498046875, 0.76806640625, 0.986328125, 1.20458984375, 1.4228515625, 1.64111328125, 1.859375, 2.07763671875, 2.2958984375, 2.51416015625, 2.732421875, 2.95068359375, 3.1689453125, 3.38720703125, 3.60546875, 3.82373046875, 4.0419921875, 4.26025390625, 4.478515625, 4.69677734375, 4.9150390625, 5.13330078125, 5.3515625, 5.56982421875, 5.7880859375, 6.00634765625, 6.224609375, 6.44287109375, 6.6611328125, 6.87939453125, 7.09765625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 13.0, 16.0, 16.0, 33.0, 61.0, 129.0, 213.0, 218.0, 119.0, 71.0, 37.0, 19.0, 17.0, 10.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.783355712890625, -2.66241455078125, -2.541473388671875, -2.4205322265625, -2.299591064453125, -2.17864990234375, -2.057708740234375, -1.936767578125, -1.815826416015625, -1.69488525390625, -1.573944091796875, -1.4530029296875, -1.332061767578125, -1.21112060546875, -1.090179443359375, -0.96923828125, -0.848297119140625, -0.72735595703125, -0.606414794921875, -0.4854736328125, -0.364532470703125, -0.24359130859375, -0.122650146484375, -0.001708984375, 0.119232177734375, 0.24017333984375, 0.361114501953125, 0.4820556640625, 0.602996826171875, 0.72393798828125, 0.844879150390625, 0.9658203125, 1.086761474609375, 1.20770263671875, 1.328643798828125, 1.4495849609375, 1.570526123046875, 1.69146728515625, 1.812408447265625, 1.933349609375, 2.054290771484375, 2.17523193359375, 2.296173095703125, 2.4171142578125, 2.538055419921875, 2.65899658203125, 2.779937744140625, 2.90087890625, 3.021820068359375, 3.14276123046875, 3.263702392578125, 3.3846435546875, 3.505584716796875, 3.62652587890625, 3.747467041015625, 3.868408203125, 3.989349365234375, 4.11029052734375, 4.231231689453125, 4.3521728515625, 4.473114013671875, 4.59405517578125, 4.714996337890625, 4.8359375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 13.0, 21.0, 71.0, 174.0, 396.0, 219.0, 65.0, 22.0, 16.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.78337860107422, -47.2387809753418, -45.69417953491211, -44.14958190917969, -42.60498046875, -41.06038284301758, -39.515785217285156, -37.97118377685547, -36.42658615112305, -34.881988525390625, -33.33738708496094, -31.792789459228516, -30.24818992614746, -28.703590393066406, -27.158992767333984, -25.61439323425293, -24.069793701171875, -22.52519416809082, -20.980594635009766, -19.435997009277344, -17.89139747619629, -16.346797943115234, -14.802199363708496, -13.257600784301758, -11.713001251220703, -10.168401718139648, -8.62380313873291, -7.079204082489014, -5.534605026245117, -3.9900059700012207, -2.445406913757324, -0.9008083343505859, 0.6437911987304688, 2.1883902549743652, 3.7329893112182617, 5.277588367462158, 6.822187423706055, 8.36678695678711, 9.911385536193848, 11.455984115600586, 13.00058364868164, 14.545183181762695, 16.08978271484375, 17.634380340576172, 19.178979873657227, 20.72357940673828, 22.268177032470703, 23.812776565551758, 25.357376098632812, 26.901975631713867, 28.446575164794922, 29.991172790527344, 31.5357723236084, 33.08037185668945, 34.624969482421875, 36.16957092285156, 37.714168548583984, 39.258766174316406, 40.803367614746094, 42.347965240478516, 43.89256286621094, 45.437164306640625, 46.98176193237305, 48.52635955810547, 50.070960998535156]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 4.0, 7.0, 4.0, 8.0, 10.0, 12.0, 22.0, 26.0, 31.0, 34.0, 47.0, 48.0, 67.0, 72.0, 68.0, 74.0, 74.0, 51.0, 56.0, 52.0, 49.0, 40.0, 37.0, 28.0, 23.0, 14.0, 13.0, 10.0, 6.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.320974349975586, -16.800146102905273, -16.27931785583496, -15.758490562438965, -15.237663269042969, -14.716835021972656, -14.196006774902344, -13.675178527832031, -13.154351234436035, -12.633522987365723, -12.112695693969727, -11.591867446899414, -11.071039199829102, -10.550211906433105, -10.029383659362793, -9.508556365966797, -8.987728118896484, -8.466899871826172, -7.946072578430176, -7.425244331359863, -6.904416561126709, -6.383588790893555, -5.862760543823242, -5.341932773590088, -4.821105003356934, -4.300277233123779, -3.779449224472046, -3.2586212158203125, -2.737793445587158, -2.216965675354004, -1.6961376667022705, -1.175309658050537, -0.6544818878173828, -0.13365399837493896, 0.3871738910675049, 0.9080017805099487, 1.4288296699523926, 1.9496574401855469, 2.4704854488372803, 2.9913134574890137, 3.512141227722168, 4.032968997955322, 4.553796768188477, 5.074625015258789, 5.595452785491943, 6.116280555725098, 6.63710880279541, 7.1579365730285645, 7.678764343261719, 8.199592590332031, 8.720419883728027, 9.24124813079834, 9.762075424194336, 10.282903671264648, 10.803731918334961, 11.324560165405273, 11.84538745880127, 12.366215705871582, 12.887042999267578, 13.40787124633789, 13.928699493408203, 14.4495267868042, 14.970355033874512, 15.491182327270508, 16.01201057434082]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 2.0, 0.0, 0.0, 10.0, 4.0, 6.0, 6.0, 9.0, 25.0, 18.0, 10.0, 30.0, 36.0, 74.0, 308.0, 4165901.0, 27452.0, 197.0, 36.0, 24.0, 22.0, 24.0, 20.0, 14.0, 0.0, 14.0, 0.0, 10.0, 6.0, 2.0, 8.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-194.25, -189.4951171875, -184.740234375, -179.9853515625, -175.23046875, -170.4755859375, -165.720703125, -160.9658203125, -156.2109375, -151.4560546875, -146.701171875, -141.9462890625, -137.19140625, -132.4365234375, -127.681640625, -122.9267578125, -118.171875, -113.4169921875, -108.662109375, -103.9072265625, -99.15234375, -94.3974609375, -89.642578125, -84.8876953125, -80.1328125, -75.3779296875, -70.623046875, -65.8681640625, -61.11328125, -56.3583984375, -51.603515625, -46.8486328125, -42.09375, -37.3388671875, -32.583984375, -27.8291015625, -23.07421875, -18.3193359375, -13.564453125, -8.8095703125, -4.0546875, 0.7001953125, 5.455078125, 10.2099609375, 14.96484375, 19.7197265625, 24.474609375, 29.2294921875, 33.984375, 38.7392578125, 43.494140625, 48.2490234375, 53.00390625, 57.7587890625, 62.513671875, 67.2685546875, 72.0234375, 76.7783203125, 81.533203125, 86.2880859375, 91.04296875, 95.7978515625, 100.552734375, 105.3076171875, 110.0625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 8.0, 5.0, 6.0, 10.0, 15.0, 13.0, 17.0, 28.0, 18.0, 31.0, 46.0, 42.0, 55.0, 50.0, 48.0, 42.0, 52.0, 62.0, 53.0, 42.0, 34.0, 45.0, 47.0, 34.0, 28.0, 25.0, 22.0, 23.0, 19.0, 13.0, 15.0, 13.0, 8.0, 9.0, 10.0, 1.0, 4.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.34814453125, -0.3383522033691406, -0.32855987548828125, -0.3187675476074219, -0.3089752197265625, -0.2991828918457031, -0.28939056396484375, -0.2795982360839844, -0.269805908203125, -0.2600135803222656, -0.25022125244140625, -0.24042892456054688, -0.2306365966796875, -0.22084426879882812, -0.21105194091796875, -0.20125961303710938, -0.19146728515625, -0.18167495727539062, -0.17188262939453125, -0.16209030151367188, -0.1522979736328125, -0.14250564575195312, -0.13271331787109375, -0.12292098999023438, -0.113128662109375, -0.10333633422851562, -0.09354400634765625, -0.08375167846679688, -0.0739593505859375, -0.06416702270507812, -0.05437469482421875, -0.044582366943359375, -0.0347900390625, -0.024997711181640625, -0.01520538330078125, -0.005413055419921875, 0.0043792724609375, 0.014171600341796875, 0.02396392822265625, 0.033756256103515625, 0.043548583984375, 0.053340911865234375, 0.06313323974609375, 0.07292556762695312, 0.0827178955078125, 0.09251022338867188, 0.10230255126953125, 0.11209487915039062, 0.12188720703125, 0.13167953491210938, 0.14147186279296875, 0.15126419067382812, 0.1610565185546875, 0.17084884643554688, 0.18064117431640625, 0.19043350219726562, 0.200225830078125, 0.21001815795898438, 0.21981048583984375, 0.22960281372070312, 0.2393951416015625, 0.24918746948242188, 0.25897979736328125, 0.2687721252441406, 0.278564453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [8.0, 34.0, 637.0, 4193225.0, 351.0, 38.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.828125, -18.115966796875, -10.40380859375, -2.691650390625, 5.0205078125, 12.732666015625, 20.44482421875, 28.156982421875, 35.869140625, 43.581298828125, 51.29345703125, 59.005615234375, 66.7177734375, 74.429931640625, 82.14208984375, 89.854248046875, 97.56640625, 105.278564453125, 112.99072265625, 120.702880859375, 128.4150390625, 136.127197265625, 143.83935546875, 151.551513671875, 159.263671875, 166.975830078125, 174.68798828125, 182.400146484375, 190.1123046875, 197.824462890625, 205.53662109375, 213.248779296875, 220.9609375, 228.673095703125, 236.38525390625, 244.097412109375, 251.8095703125, 259.521728515625, 267.23388671875, 274.946044921875, 282.658203125, 290.370361328125, 298.08251953125, 305.794677734375, 313.5068359375, 321.218994140625, 328.93115234375, 336.643310546875, 344.35546875, 352.067626953125, 359.77978515625, 367.491943359375, 375.2041015625, 382.916259765625, 390.62841796875, 398.340576171875, 406.052734375, 413.764892578125, 421.47705078125, 429.189208984375, 436.9013671875, 444.613525390625, 452.32568359375, 460.037841796875, 467.75]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 13.0, 13.0, 22.0, 21.0, 40.0, 72.0, 116.0, 304.0, 2232.0, 751.0, 250.0, 103.0, 59.0, 28.0, 19.0, 13.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2138671875, -1.1524200439453125, -1.090972900390625, -1.0295257568359375, -0.96807861328125, -0.9066314697265625, -0.845184326171875, -0.7837371826171875, -0.7222900390625, -0.6608428955078125, -0.599395751953125, -0.5379486083984375, -0.47650146484375, -0.4150543212890625, -0.353607177734375, -0.2921600341796875, -0.230712890625, -0.1692657470703125, -0.107818603515625, -0.0463714599609375, 0.01507568359375, 0.0765228271484375, 0.137969970703125, 0.1994171142578125, 0.2608642578125, 0.3223114013671875, 0.383758544921875, 0.4452056884765625, 0.50665283203125, 0.5680999755859375, 0.629547119140625, 0.6909942626953125, 0.75244140625, 0.8138885498046875, 0.875335693359375, 0.9367828369140625, 0.99822998046875, 1.0596771240234375, 1.121124267578125, 1.1825714111328125, 1.2440185546875, 1.3054656982421875, 1.366912841796875, 1.4283599853515625, 1.48980712890625, 1.5512542724609375, 1.612701416015625, 1.6741485595703125, 1.735595703125, 1.7970428466796875, 1.858489990234375, 1.9199371337890625, 1.98138427734375, 2.0428314208984375, 2.104278564453125, 2.1657257080078125, 2.2271728515625, 2.2886199951171875, 2.350067138671875, 2.4115142822265625, 2.47296142578125, 2.5344085693359375, 2.595855712890625, 2.6573028564453125, 2.71875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [110.0, 908.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.850528717041016, -1.6907825469970703, 16.468963623046875, 34.62871170043945, 52.788455963134766, 70.94819641113281, 89.10795593261719, 107.2677001953125, 125.42744445800781, 143.58718872070312, 161.74693298339844, 179.90667724609375, 198.06643676757812, 216.22616577148438, 234.38592529296875, 252.54566955566406, 270.7054138183594, 288.86517333984375, 307.02490234375, 325.1846618652344, 343.3443908691406, 361.504150390625, 379.66387939453125, 397.8236389160156, 415.9833679199219, 434.14312744140625, 452.3028564453125, 470.4626159667969, 488.6223449707031, 506.7821044921875, 524.9418334960938, 543.1015625, 561.2612915039062, 579.4210205078125, 597.580810546875, 615.7405395507812, 633.9002685546875, 652.0599975585938, 670.2197875976562, 688.3795166015625, 706.5392456054688, 724.698974609375, 742.8587646484375, 761.0184936523438, 779.17822265625, 797.3379516601562, 815.4977416992188, 833.657470703125, 851.8172607421875, 869.9769897460938, 888.1367797851562, 906.2965087890625, 924.4562377929688, 942.615966796875, 960.7757568359375, 978.9354858398438, 997.09521484375, 1015.2549438476562, 1033.4146728515625, 1051.574462890625, 1069.7342529296875, 1087.8939208984375, 1106.0537109375, 1124.21337890625, 1142.3731689453125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 20.0, 46.0, 74.0, 123.0, 215.0, 193.0, 147.0, 104.0, 47.0, 23.0, 12.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.951873779296875, -18.747283935546875, -17.542692184448242, -16.338102340698242, -15.133512496948242, -13.928921699523926, -12.72433090209961, -11.51974105834961, -10.315150260925293, -9.110559463500977, -7.905969619750977, -6.70137882232666, -5.496788501739502, -4.292198181152344, -3.0876073837280273, -1.8830175399780273, -0.6784267425537109, 0.5261636972427368, 1.7307541370391846, 2.935344696044922, 4.13993501663208, 5.344525337219238, 6.549116134643555, 7.753705978393555, 8.958296775817871, 10.162887573242188, 11.367477416992188, 12.572068214416504, 13.77665901184082, 14.98124885559082, 16.185840606689453, 17.390430450439453, 18.595020294189453, 19.799610137939453, 21.004201889038086, 22.208791732788086, 23.413381576538086, 24.61797332763672, 25.82256317138672, 27.02715301513672, 28.23174285888672, 29.43633270263672, 30.64092445373535, 31.84551429748535, 33.050106048583984, 34.254695892333984, 35.459285736083984, 36.663875579833984, 37.86846923828125, 39.07305908203125, 40.27764892578125, 41.48223876953125, 42.686832427978516, 43.891422271728516, 45.096012115478516, 46.300601959228516, 47.505191802978516, 48.709781646728516, 49.914371490478516, 51.11896514892578, 52.32355499267578, 53.52814483642578, 54.73273468017578, 55.93732452392578, 57.14191436767578]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 5.0, 2.0, 6.0, 7.0, 16.0, 9.0, 17.0, 25.0, 15.0, 23.0, 28.0, 39.0, 35.0, 36.0, 36.0, 69.0, 361.0, 11621.0, 1006058.0, 29159.0, 502.0, 107.0, 41.0, 38.0, 41.0, 41.0, 30.0, 32.0, 21.0, 18.0, 18.0, 17.0, 13.0, 9.0, 8.0, 9.0, 5.0, 11.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.4375, -53.5634765625, -51.689453125, -49.8154296875, -47.94140625, -46.0673828125, -44.193359375, -42.3193359375, -40.4453125, -38.5712890625, -36.697265625, -34.8232421875, -32.94921875, -31.0751953125, -29.201171875, -27.3271484375, -25.453125, -23.5791015625, -21.705078125, -19.8310546875, -17.95703125, -16.0830078125, -14.208984375, -12.3349609375, -10.4609375, -8.5869140625, -6.712890625, -4.8388671875, -2.96484375, -1.0908203125, 0.783203125, 2.6572265625, 4.53125, 6.4052734375, 8.279296875, 10.1533203125, 12.02734375, 13.9013671875, 15.775390625, 17.6494140625, 19.5234375, 21.3974609375, 23.271484375, 25.1455078125, 27.01953125, 28.8935546875, 30.767578125, 32.6416015625, 34.515625, 36.3896484375, 38.263671875, 40.1376953125, 42.01171875, 43.8857421875, 45.759765625, 47.6337890625, 49.5078125, 51.3818359375, 53.255859375, 55.1298828125, 57.00390625, 58.8779296875, 60.751953125, 62.6259765625, 64.5]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 9.0, 63.0, 158.0, 258.0, 279.0, 160.0, 60.0, 21.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95166015625, -0.7970199584960938, -0.6423797607421875, -0.48773956298828125, -0.333099365234375, -0.17845916748046875, -0.0238189697265625, 0.13082122802734375, 0.28546142578125, 0.44010162353515625, 0.5947418212890625, 0.7493820190429688, 0.904022216796875, 1.0586624145507812, 1.2133026123046875, 1.3679428100585938, 1.5225830078125, 1.6772232055664062, 1.8318634033203125, 1.9865036010742188, 2.141143798828125, 2.2957839965820312, 2.4504241943359375, 2.6050643920898438, 2.75970458984375, 2.9143447875976562, 3.0689849853515625, 3.2236251831054688, 3.378265380859375, 3.5329055786132812, 3.6875457763671875, 3.8421859741210938, 3.996826171875, 4.151466369628906, 4.3061065673828125, 4.460746765136719, 4.615386962890625, 4.770027160644531, 4.9246673583984375, 5.079307556152344, 5.23394775390625, 5.388587951660156, 5.5432281494140625, 5.697868347167969, 5.852508544921875, 6.007148742675781, 6.1617889404296875, 6.316429138183594, 6.4710693359375, 6.625709533691406, 6.7803497314453125, 6.934989929199219, 7.089630126953125, 7.244270324707031, 7.3989105224609375, 7.553550720214844, 7.70819091796875, 7.862831115722656, 8.017471313476562, 8.172111511230469, 8.326751708984375, 8.481391906738281, 8.636032104492188, 8.790672302246094, 8.9453125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 5.0, 3.0, 3.0, 2.0, 6.0, 6.0, 5.0, 7.0, 8.0, 19.0, 25.0, 31.0, 53.0, 81.0, 121.0, 194.0, 379.0, 946.0, 2957.0, 15965.0, 250208.0, 726001.0, 43517.0, 5362.0, 1490.0, 497.0, 238.0, 139.0, 87.0, 46.0, 48.0, 28.0, 20.0, 16.0, 12.0, 12.0, 7.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-39.625, -38.466796875, -37.30859375, -36.150390625, -34.9921875, -33.833984375, -32.67578125, -31.517578125, -30.359375, -29.201171875, -28.04296875, -26.884765625, -25.7265625, -24.568359375, -23.41015625, -22.251953125, -21.09375, -19.935546875, -18.77734375, -17.619140625, -16.4609375, -15.302734375, -14.14453125, -12.986328125, -11.828125, -10.669921875, -9.51171875, -8.353515625, -7.1953125, -6.037109375, -4.87890625, -3.720703125, -2.5625, -1.404296875, -0.24609375, 0.912109375, 2.0703125, 3.228515625, 4.38671875, 5.544921875, 6.703125, 7.861328125, 9.01953125, 10.177734375, 11.3359375, 12.494140625, 13.65234375, 14.810546875, 15.96875, 17.126953125, 18.28515625, 19.443359375, 20.6015625, 21.759765625, 22.91796875, 24.076171875, 25.234375, 26.392578125, 27.55078125, 28.708984375, 29.8671875, 31.025390625, 32.18359375, 33.341796875, 34.5]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 7.0, 1.0, 3.0, 7.0, 9.0, 14.0, 17.0, 29.0, 23.0, 29.0, 42.0, 51.0, 49.0, 46.0, 49.0, 53.0, 33.0, 50.0, 67.0, 65.0, 51.0, 52.0, 41.0, 35.0, 28.0, 25.0, 37.0, 20.0, 16.0, 12.0, 9.0, 11.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.265625, -8.96142578125, -8.6572265625, -8.35302734375, -8.048828125, -7.74462890625, -7.4404296875, -7.13623046875, -6.83203125, -6.52783203125, -6.2236328125, -5.91943359375, -5.615234375, -5.31103515625, -5.0068359375, -4.70263671875, -4.3984375, -4.09423828125, -3.7900390625, -3.48583984375, -3.181640625, -2.87744140625, -2.5732421875, -2.26904296875, -1.96484375, -1.66064453125, -1.3564453125, -1.05224609375, -0.748046875, -0.44384765625, -0.1396484375, 0.16455078125, 0.46875, 0.77294921875, 1.0771484375, 1.38134765625, 1.685546875, 1.98974609375, 2.2939453125, 2.59814453125, 2.90234375, 3.20654296875, 3.5107421875, 3.81494140625, 4.119140625, 4.42333984375, 4.7275390625, 5.03173828125, 5.3359375, 5.64013671875, 5.9443359375, 6.24853515625, 6.552734375, 6.85693359375, 7.1611328125, 7.46533203125, 7.76953125, 8.07373046875, 8.3779296875, 8.68212890625, 8.986328125, 9.29052734375, 9.5947265625, 9.89892578125, 10.203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 11.0, 17.0, 21.0, 38.0, 54.0, 92.0, 179.0, 401.0, 1109.0, 3731.0, 26510.0, 746258.0, 252454.0, 13704.0, 2483.0, 795.0, 338.0, 131.0, 70.0, 50.0, 33.0, 18.0, 10.0, 5.0, 11.0, 4.0, 5.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.90625, -42.52783203125, -41.1494140625, -39.77099609375, -38.392578125, -37.01416015625, -35.6357421875, -34.25732421875, -32.87890625, -31.50048828125, -30.1220703125, -28.74365234375, -27.365234375, -25.98681640625, -24.6083984375, -23.22998046875, -21.8515625, -20.47314453125, -19.0947265625, -17.71630859375, -16.337890625, -14.95947265625, -13.5810546875, -12.20263671875, -10.82421875, -9.44580078125, -8.0673828125, -6.68896484375, -5.310546875, -3.93212890625, -2.5537109375, -1.17529296875, 0.203125, 1.58154296875, 2.9599609375, 4.33837890625, 5.716796875, 7.09521484375, 8.4736328125, 9.85205078125, 11.23046875, 12.60888671875, 13.9873046875, 15.36572265625, 16.744140625, 18.12255859375, 19.5009765625, 20.87939453125, 22.2578125, 23.63623046875, 25.0146484375, 26.39306640625, 27.771484375, 29.14990234375, 30.5283203125, 31.90673828125, 33.28515625, 34.66357421875, 36.0419921875, 37.42041015625, 38.798828125, 40.17724609375, 41.5556640625, 42.93408203125, 44.3125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 4.0, 8.0, 10.0, 24.0, 23.0, 40.0, 53.0, 83.0, 153.0, 198.0, 136.0, 93.0, 55.0, 40.0, 20.0, 21.0, 10.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002452850341796875, -0.0023600757122039795, -0.002267301082611084, -0.0021745264530181885, -0.002081751823425293, -0.0019889771938323975, -0.001896202564239502, -0.0018034279346466064, -0.001710653305053711, -0.0016178786754608154, -0.00152510404586792, -0.0014323294162750244, -0.001339554786682129, -0.0012467801570892334, -0.0011540055274963379, -0.0010612308979034424, -0.0009684562683105469, -0.0008756816387176514, -0.0007829070091247559, -0.0006901323795318604, -0.0005973577499389648, -0.0005045831203460693, -0.00041180849075317383, -0.0003190338611602783, -0.0002262592315673828, -0.0001334846019744873, -4.07099723815918e-05, 5.206465721130371e-05, 0.00014483928680419922, 0.00023761391639709473, 0.00033038854598999023, 0.00042316317558288574, 0.0005159378051757812, 0.0006087124347686768, 0.0007014870643615723, 0.0007942616939544678, 0.0008870363235473633, 0.0009798109531402588, 0.0010725855827331543, 0.0011653602123260498, 0.0012581348419189453, 0.0013509094715118408, 0.0014436841011047363, 0.0015364587306976318, 0.0016292333602905273, 0.0017220079898834229, 0.0018147826194763184, 0.0019075572490692139, 0.0020003318786621094, 0.002093106508255005, 0.0021858811378479004, 0.002278655767440796, 0.0023714303970336914, 0.002464205026626587, 0.0025569796562194824, 0.002649754285812378, 0.0027425289154052734, 0.002835303544998169, 0.0029280781745910645, 0.00302085280418396, 0.0031136274337768555, 0.003206402063369751, 0.0032991766929626465, 0.003391951322555542, 0.0034847259521484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 4.0, 6.0, 11.0, 15.0, 20.0, 41.0, 75.0, 160.0, 404.0, 1476.0, 10095.0, 746006.0, 281948.0, 6474.0, 1142.0, 344.0, 138.0, 66.0, 51.0, 25.0, 10.0, 10.0, 4.0, 4.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.90625, -51.34619140625, -49.7861328125, -48.22607421875, -46.666015625, -45.10595703125, -43.5458984375, -41.98583984375, -40.42578125, -38.86572265625, -37.3056640625, -35.74560546875, -34.185546875, -32.62548828125, -31.0654296875, -29.50537109375, -27.9453125, -26.38525390625, -24.8251953125, -23.26513671875, -21.705078125, -20.14501953125, -18.5849609375, -17.02490234375, -15.46484375, -13.90478515625, -12.3447265625, -10.78466796875, -9.224609375, -7.66455078125, -6.1044921875, -4.54443359375, -2.984375, -1.42431640625, 0.1357421875, 1.69580078125, 3.255859375, 4.81591796875, 6.3759765625, 7.93603515625, 9.49609375, 11.05615234375, 12.6162109375, 14.17626953125, 15.736328125, 17.29638671875, 18.8564453125, 20.41650390625, 21.9765625, 23.53662109375, 25.0966796875, 26.65673828125, 28.216796875, 29.77685546875, 31.3369140625, 32.89697265625, 34.45703125, 36.01708984375, 37.5771484375, 39.13720703125, 40.697265625, 42.25732421875, 43.8173828125, 45.37744140625, 46.9375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 4.0, 6.0, 8.0, 6.0, 11.0, 11.0, 33.0, 36.0, 71.0, 99.0, 107.0, 135.0, 144.0, 92.0, 60.0, 54.0, 35.0, 25.0, 11.0, 16.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.5498046875, -11.185546875, -10.8212890625, -10.45703125, -10.0927734375, -9.728515625, -9.3642578125, -9.0, -8.6357421875, -8.271484375, -7.9072265625, -7.54296875, -7.1787109375, -6.814453125, -6.4501953125, -6.0859375, -5.7216796875, -5.357421875, -4.9931640625, -4.62890625, -4.2646484375, -3.900390625, -3.5361328125, -3.171875, -2.8076171875, -2.443359375, -2.0791015625, -1.71484375, -1.3505859375, -0.986328125, -0.6220703125, -0.2578125, 0.1064453125, 0.470703125, 0.8349609375, 1.19921875, 1.5634765625, 1.927734375, 2.2919921875, 2.65625, 3.0205078125, 3.384765625, 3.7490234375, 4.11328125, 4.4775390625, 4.841796875, 5.2060546875, 5.5703125, 5.9345703125, 6.298828125, 6.6630859375, 7.02734375, 7.3916015625, 7.755859375, 8.1201171875, 8.484375, 8.8486328125, 9.212890625, 9.5771484375, 9.94140625, 10.3056640625, 10.669921875, 11.0341796875, 11.3984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 6.0, 8.0, 35.0, 197.0, 570.0, 157.0, 28.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-592.0087890625, -580.5338745117188, -569.0589599609375, -557.5840454101562, -546.109130859375, -534.6342163085938, -523.1593017578125, -511.6844177246094, -500.2095031738281, -488.7345886230469, -477.2596740722656, -465.7847595214844, -454.3098449707031, -442.8349609375, -431.36004638671875, -419.8851318359375, -408.41021728515625, -396.935302734375, -385.46038818359375, -373.9854736328125, -362.51055908203125, -351.03564453125, -339.56072998046875, -328.0858459472656, -316.61090087890625, -305.135986328125, -293.66107177734375, -282.1861572265625, -270.71124267578125, -259.236328125, -247.7614288330078, -236.28652954101562, -224.81163024902344, -213.3367156982422, -201.86180114746094, -190.38690185546875, -178.9119873046875, -167.43707275390625, -155.962158203125, -144.48724365234375, -133.0123291015625, -121.53741455078125, -110.06250762939453, -98.58759307861328, -87.11268615722656, -75.63777160644531, -64.16285705566406, -52.687950134277344, -41.213043212890625, -29.73813247680664, -18.263219833374023, -6.788307189941406, 4.686603546142578, 16.161514282226562, 27.636428833007812, 39.11133575439453, 50.58625030517578, 62.061161041259766, 73.53607177734375, 85.010986328125, 96.48590087890625, 107.96080780029297, 119.43572235107422, 130.91062927246094, 142.3855438232422]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 13.0, 22.0, 23.0, 33.0, 23.0, 46.0, 36.0, 44.0, 70.0, 70.0, 78.0, 60.0, 77.0, 64.0, 71.0, 61.0, 52.0, 50.0, 29.0, 18.0, 20.0, 11.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-104.25460052490234, -101.61312103271484, -98.97164154052734, -96.33016204833984, -93.68867492675781, -91.04719543457031, -88.40571594238281, -85.76423645019531, -83.12275695800781, -80.48127746582031, -77.83979797363281, -75.19831848144531, -72.55683898925781, -69.91535186767578, -67.27387237548828, -64.63239288330078, -61.99091339111328, -59.34943389892578, -56.70795440673828, -54.066471099853516, -51.424991607666016, -48.783512115478516, -46.14202880859375, -43.50054931640625, -40.85906982421875, -38.21759033203125, -35.57611083984375, -32.934627532958984, -30.293148040771484, -27.651668548583984, -25.01018714904785, -22.36870574951172, -19.72723388671875, -17.08575439453125, -14.444272994995117, -11.8027925491333, -9.161312103271484, -6.519831657409668, -3.8783512115478516, -1.2368698120117188, 1.4046096801757812, 4.046090126037598, 6.687570571899414, 9.32905101776123, 11.970531463623047, 14.612011909484863, 17.25349235534668, 19.894973754882812, 22.536453247070312, 25.177932739257812, 27.819414138793945, 30.460895538330078, 33.10237503051758, 35.74385452270508, 38.385337829589844, 41.026817321777344, 43.668296813964844, 46.309776306152344, 48.951255798339844, 51.59273910522461, 54.23421859741211, 56.87569808959961, 59.517181396484375, 62.158660888671875, 64.80014038085938]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 26.0, 71.0, 344.0, 2287.0, 4188288.0, 2496.0, 493.0, 123.0, 72.0, 40.0, 21.0, 12.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-95.375, -87.755859375, -80.13671875, -72.517578125, -64.8984375, -57.279296875, -49.66015625, -42.041015625, -34.421875, -26.802734375, -19.18359375, -11.564453125, -3.9453125, 3.673828125, 11.29296875, 18.912109375, 26.53125, 34.150390625, 41.76953125, 49.388671875, 57.0078125, 64.626953125, 72.24609375, 79.865234375, 87.484375, 95.103515625, 102.72265625, 110.341796875, 117.9609375, 125.580078125, 133.19921875, 140.818359375, 148.4375, 156.056640625, 163.67578125, 171.294921875, 178.9140625, 186.533203125, 194.15234375, 201.771484375, 209.390625, 217.009765625, 224.62890625, 232.248046875, 239.8671875, 247.486328125, 255.10546875, 262.724609375, 270.34375, 277.962890625, 285.58203125, 293.201171875, 300.8203125, 308.439453125, 316.05859375, 323.677734375, 331.296875, 338.916015625, 346.53515625, 354.154296875, 361.7734375, 369.392578125, 377.01171875, 384.630859375, 392.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 16.0, 61.0, 146.0, 233.0, 274.0, 184.0, 74.0, 11.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.88671875, -2.68292236328125, -2.4791259765625, -2.27532958984375, -2.071533203125, -1.86773681640625, -1.6639404296875, -1.46014404296875, -1.25634765625, -1.05255126953125, -0.8487548828125, -0.64495849609375, -0.441162109375, -0.23736572265625, -0.0335693359375, 0.17022705078125, 0.3740234375, 0.57781982421875, 0.7816162109375, 0.98541259765625, 1.189208984375, 1.39300537109375, 1.5968017578125, 1.80059814453125, 2.00439453125, 2.20819091796875, 2.4119873046875, 2.61578369140625, 2.819580078125, 3.02337646484375, 3.2271728515625, 3.43096923828125, 3.634765625, 3.83856201171875, 4.0423583984375, 4.24615478515625, 4.449951171875, 4.65374755859375, 4.8575439453125, 5.06134033203125, 5.26513671875, 5.46893310546875, 5.6727294921875, 5.87652587890625, 6.080322265625, 6.28411865234375, 6.4879150390625, 6.69171142578125, 6.8955078125, 7.09930419921875, 7.3031005859375, 7.50689697265625, 7.710693359375, 7.91448974609375, 8.1182861328125, 8.32208251953125, 8.52587890625, 8.72967529296875, 8.9334716796875, 9.13726806640625, 9.341064453125, 9.54486083984375, 9.7486572265625, 9.95245361328125, 10.15625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 11.0, 16.0, 41.0, 103.0, 174.0, 263.0, 7440.0, 4185240.0, 366.0, 279.0, 158.0, 86.0, 55.0, 30.0, 16.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-356.0, -336.3984375, -316.796875, -297.1953125, -277.59375, -257.9921875, -238.390625, -218.7890625, -199.1875, -179.5859375, -159.984375, -140.3828125, -120.78125, -101.1796875, -81.578125, -61.9765625, -42.375, -22.7734375, -3.171875, 16.4296875, 36.03125, 55.6328125, 75.234375, 94.8359375, 114.4375, 134.0390625, 153.640625, 173.2421875, 192.84375, 212.4453125, 232.046875, 251.6484375, 271.25, 290.8515625, 310.453125, 330.0546875, 349.65625, 369.2578125, 388.859375, 408.4609375, 428.0625, 447.6640625, 467.265625, 486.8671875, 506.46875, 526.0703125, 545.671875, 565.2734375, 584.875, 604.4765625, 624.078125, 643.6796875, 663.28125, 682.8828125, 702.484375, 722.0859375, 741.6875, 761.2890625, 780.890625, 800.4921875, 820.09375, 839.6953125, 859.296875, 878.8984375, 898.5]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 9.0, 58.0, 1159.0, 2763.0, 77.0, 13.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.9921875, -6.9976806640625, -6.003173828125, -5.0086669921875, -4.01416015625, -3.0196533203125, -2.025146484375, -1.0306396484375, -0.0361328125, 0.9583740234375, 1.952880859375, 2.9473876953125, 3.94189453125, 4.9364013671875, 5.930908203125, 6.9254150390625, 7.919921875, 8.9144287109375, 9.908935546875, 10.9034423828125, 11.89794921875, 12.8924560546875, 13.886962890625, 14.8814697265625, 15.8759765625, 16.8704833984375, 17.864990234375, 18.8594970703125, 19.85400390625, 20.8485107421875, 21.843017578125, 22.8375244140625, 23.83203125, 24.8265380859375, 25.821044921875, 26.8155517578125, 27.81005859375, 28.8045654296875, 29.799072265625, 30.7935791015625, 31.7880859375, 32.7825927734375, 33.777099609375, 34.7716064453125, 35.76611328125, 36.7606201171875, 37.755126953125, 38.7496337890625, 39.744140625, 40.7386474609375, 41.733154296875, 42.7276611328125, 43.72216796875, 44.7166748046875, 45.711181640625, 46.7056884765625, 47.7001953125, 48.6947021484375, 49.689208984375, 50.6837158203125, 51.67822265625, 52.6727294921875, 53.667236328125, 54.6617431640625, 55.65625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 15.0, 380.0, 592.0, 23.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-398.337646484375, -367.76678466796875, -337.1959228515625, -306.62506103515625, -276.05419921875, -245.4833221435547, -214.91246032714844, -184.3415985107422, -153.77073669433594, -123.19987487792969, -92.62901306152344, -62.058143615722656, -31.487281799316406, -0.916412353515625, 29.654449462890625, 60.225311279296875, 90.79617309570312, 121.36703491210938, 151.93789672851562, 182.50875854492188, 213.07962036132812, 243.65049743652344, 274.22137451171875, 304.792236328125, 335.36309814453125, 365.9339599609375, 396.50482177734375, 427.07568359375, 457.64654541015625, 488.2174072265625, 518.7882690429688, 549.359130859375, 579.9299926757812, 610.5008544921875, 641.0717163085938, 671.642578125, 702.2134399414062, 732.7843017578125, 763.3551635742188, 793.926025390625, 824.4968872070312, 855.0677490234375, 885.6386108398438, 916.20947265625, 946.7803344726562, 977.3511962890625, 1007.9220581054688, 1038.492919921875, 1069.0638427734375, 1099.634765625, 1130.20556640625, 1160.7764892578125, 1191.3472900390625, 1221.918212890625, 1252.489013671875, 1283.0599365234375, 1313.6307373046875, 1344.20166015625, 1374.7724609375, 1405.3433837890625, 1435.9141845703125, 1466.485107421875, 1497.055908203125, 1527.6268310546875, 1558.1976318359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 12.0, 29.0, 65.0, 83.0, 124.0, 163.0, 156.0, 136.0, 98.0, 67.0, 31.0, 21.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-197.8023223876953, -192.02099609375, -186.2396697998047, -180.45834350585938, -174.67701721191406, -168.89569091796875, -163.1143798828125, -157.33303833007812, -151.55172729492188, -145.77040100097656, -139.98907470703125, -134.20774841308594, -128.42642211914062, -122.64509582519531, -116.86377716064453, -111.08245086669922, -105.30111694335938, -99.51979064941406, -93.73846435546875, -87.95713806152344, -82.17581176757812, -76.39448547363281, -70.61316680908203, -64.83184051513672, -59.050514221191406, -53.269187927246094, -47.48786163330078, -41.706539154052734, -35.92521286010742, -30.14388656616211, -24.362564086914062, -18.58123779296875, -12.7999267578125, -7.018601417541504, -1.2372760772705078, 4.544048309326172, 10.325374603271484, 16.106700897216797, 21.888023376464844, 27.669349670410156, 33.45067596435547, 39.23200225830078, 45.013328552246094, 50.79465103149414, 56.57597732543945, 62.357303619384766, 68.13862609863281, 73.91995239257812, 79.70127868652344, 85.48260498046875, 91.26393127441406, 97.04525756835938, 102.82658386230469, 108.60791015625, 114.38922882080078, 120.1705551147461, 125.9518814086914, 131.7332000732422, 137.5145263671875, 143.2958526611328, 149.07717895507812, 154.85850524902344, 160.63983154296875, 166.42115783691406, 172.20248413085938]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 11.0, 17.0, 22.0, 30.0, 27.0, 48.0, 65.0, 104.0, 182.0, 319.0, 675.0, 1649.0, 5694.0, 40075.0, 712318.0, 263228.0, 18256.0, 3391.0, 1181.0, 510.0, 254.0, 170.0, 76.0, 62.0, 43.0, 30.0, 19.0, 19.0, 10.0, 8.0, 7.0, 10.0, 10.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-98.625, -95.8720703125, -93.119140625, -90.3662109375, -87.61328125, -84.8603515625, -82.107421875, -79.3544921875, -76.6015625, -73.8486328125, -71.095703125, -68.3427734375, -65.58984375, -62.8369140625, -60.083984375, -57.3310546875, -54.578125, -51.8251953125, -49.072265625, -46.3193359375, -43.56640625, -40.8134765625, -38.060546875, -35.3076171875, -32.5546875, -29.8017578125, -27.048828125, -24.2958984375, -21.54296875, -18.7900390625, -16.037109375, -13.2841796875, -10.53125, -7.7783203125, -5.025390625, -2.2724609375, 0.48046875, 3.2333984375, 5.986328125, 8.7392578125, 11.4921875, 14.2451171875, 16.998046875, 19.7509765625, 22.50390625, 25.2568359375, 28.009765625, 30.7626953125, 33.515625, 36.2685546875, 39.021484375, 41.7744140625, 44.52734375, 47.2802734375, 50.033203125, 52.7861328125, 55.5390625, 58.2919921875, 61.044921875, 63.7978515625, 66.55078125, 69.3037109375, 72.056640625, 74.8095703125, 77.5625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 10.0, 26.0, 38.0, 88.0, 134.0, 142.0, 182.0, 142.0, 104.0, 72.0, 33.0, 11.0, 10.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -7.022705078125, -6.69384765625, -6.364990234375, -6.0361328125, -5.707275390625, -5.37841796875, -5.049560546875, -4.720703125, -4.391845703125, -4.06298828125, -3.734130859375, -3.4052734375, -3.076416015625, -2.74755859375, -2.418701171875, -2.08984375, -1.760986328125, -1.43212890625, -1.103271484375, -0.7744140625, -0.445556640625, -0.11669921875, 0.212158203125, 0.541015625, 0.869873046875, 1.19873046875, 1.527587890625, 1.8564453125, 2.185302734375, 2.51416015625, 2.843017578125, 3.171875, 3.500732421875, 3.82958984375, 4.158447265625, 4.4873046875, 4.816162109375, 5.14501953125, 5.473876953125, 5.802734375, 6.131591796875, 6.46044921875, 6.789306640625, 7.1181640625, 7.447021484375, 7.77587890625, 8.104736328125, 8.43359375, 8.762451171875, 9.09130859375, 9.420166015625, 9.7490234375, 10.077880859375, 10.40673828125, 10.735595703125, 11.064453125, 11.393310546875, 11.72216796875, 12.051025390625, 12.3798828125, 12.708740234375, 13.03759765625, 13.366455078125, 13.6953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 12.0, 16.0, 16.0, 17.0, 30.0, 37.0, 49.0, 110.0, 178.0, 339.0, 660.0, 1680.0, 5815.0, 36918.0, 653503.0, 320354.0, 22071.0, 4185.0, 1298.0, 527.0, 274.0, 158.0, 90.0, 49.0, 45.0, 33.0, 25.0, 14.0, 12.0, 9.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.03125, -54.02099609375, -52.0107421875, -50.00048828125, -47.990234375, -45.97998046875, -43.9697265625, -41.95947265625, -39.94921875, -37.93896484375, -35.9287109375, -33.91845703125, -31.908203125, -29.89794921875, -27.8876953125, -25.87744140625, -23.8671875, -21.85693359375, -19.8466796875, -17.83642578125, -15.826171875, -13.81591796875, -11.8056640625, -9.79541015625, -7.78515625, -5.77490234375, -3.7646484375, -1.75439453125, 0.255859375, 2.26611328125, 4.2763671875, 6.28662109375, 8.296875, 10.30712890625, 12.3173828125, 14.32763671875, 16.337890625, 18.34814453125, 20.3583984375, 22.36865234375, 24.37890625, 26.38916015625, 28.3994140625, 30.40966796875, 32.419921875, 34.43017578125, 36.4404296875, 38.45068359375, 40.4609375, 42.47119140625, 44.4814453125, 46.49169921875, 48.501953125, 50.51220703125, 52.5224609375, 54.53271484375, 56.54296875, 58.55322265625, 60.5634765625, 62.57373046875, 64.583984375, 66.59423828125, 68.6044921875, 70.61474609375, 72.625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 10.0, 4.0, 17.0, 14.0, 22.0, 16.0, 28.0, 49.0, 33.0, 47.0, 54.0, 53.0, 47.0, 73.0, 63.0, 67.0, 54.0, 58.0, 47.0, 40.0, 28.0, 30.0, 26.0, 17.0, 13.0, 11.0, 15.0, 17.0, 9.0, 3.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.0625, -16.470458984375, -15.87841796875, -15.286376953125, -14.6943359375, -14.102294921875, -13.51025390625, -12.918212890625, -12.326171875, -11.734130859375, -11.14208984375, -10.550048828125, -9.9580078125, -9.365966796875, -8.77392578125, -8.181884765625, -7.58984375, -6.997802734375, -6.40576171875, -5.813720703125, -5.2216796875, -4.629638671875, -4.03759765625, -3.445556640625, -2.853515625, -2.261474609375, -1.66943359375, -1.077392578125, -0.4853515625, 0.106689453125, 0.69873046875, 1.290771484375, 1.8828125, 2.474853515625, 3.06689453125, 3.658935546875, 4.2509765625, 4.843017578125, 5.43505859375, 6.027099609375, 6.619140625, 7.211181640625, 7.80322265625, 8.395263671875, 8.9873046875, 9.579345703125, 10.17138671875, 10.763427734375, 11.35546875, 11.947509765625, 12.53955078125, 13.131591796875, 13.7236328125, 14.315673828125, 14.90771484375, 15.499755859375, 16.091796875, 16.683837890625, 17.27587890625, 17.867919921875, 18.4599609375, 19.052001953125, 19.64404296875, 20.236083984375, 20.828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 6.0, 15.0, 11.0, 18.0, 29.0, 76.0, 120.0, 253.0, 558.0, 1876.0, 10366.0, 1010697.0, 20695.0, 2491.0, 745.0, 267.0, 134.0, 79.0, 43.0, 18.0, 13.0, 12.0, 10.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.125, -164.1796875, -158.234375, -152.2890625, -146.34375, -140.3984375, -134.453125, -128.5078125, -122.5625, -116.6171875, -110.671875, -104.7265625, -98.78125, -92.8359375, -86.890625, -80.9453125, -75.0, -69.0546875, -63.109375, -57.1640625, -51.21875, -45.2734375, -39.328125, -33.3828125, -27.4375, -21.4921875, -15.546875, -9.6015625, -3.65625, 2.2890625, 8.234375, 14.1796875, 20.125, 26.0703125, 32.015625, 37.9609375, 43.90625, 49.8515625, 55.796875, 61.7421875, 67.6875, 73.6328125, 79.578125, 85.5234375, 91.46875, 97.4140625, 103.359375, 109.3046875, 115.25, 121.1953125, 127.140625, 133.0859375, 139.03125, 144.9765625, 150.921875, 156.8671875, 162.8125, 168.7578125, 174.703125, 180.6484375, 186.59375, 192.5390625, 198.484375, 204.4296875, 210.375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 17.0, 60.0, 228.0, 442.0, 159.0, 53.0, 13.0, 12.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007232666015625, -0.0067901611328125, -0.00634765625, -0.0059051513671875, -0.005462646484375, -0.0050201416015625, -0.00457763671875, -0.0041351318359375, -0.003692626953125, -0.0032501220703125, -0.0028076171875, -0.0023651123046875, -0.001922607421875, -0.0014801025390625, -0.00103759765625, -0.0005950927734375, -0.000152587890625, 0.0002899169921875, 0.000732421875, 0.0011749267578125, 0.001617431640625, 0.0020599365234375, 0.00250244140625, 0.0029449462890625, 0.003387451171875, 0.0038299560546875, 0.0042724609375, 0.0047149658203125, 0.005157470703125, 0.0055999755859375, 0.00604248046875, 0.0064849853515625, 0.006927490234375, 0.0073699951171875, 0.0078125, 0.0082550048828125, 0.008697509765625, 0.0091400146484375, 0.00958251953125, 0.0100250244140625, 0.010467529296875, 0.0109100341796875, 0.0113525390625, 0.0117950439453125, 0.012237548828125, 0.0126800537109375, 0.01312255859375, 0.0135650634765625, 0.014007568359375, 0.0144500732421875, 0.014892578125, 0.0153350830078125, 0.015777587890625, 0.0162200927734375, 0.01666259765625, 0.0171051025390625, 0.017547607421875, 0.0179901123046875, 0.0184326171875, 0.0188751220703125, 0.019317626953125, 0.0197601318359375, 0.02020263671875, 0.0206451416015625, 0.021087646484375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 10.0, 13.0, 14.0, 43.0, 88.0, 247.0, 1227.0, 286629.0, 758376.0, 1438.0, 248.0, 104.0, 56.0, 26.0, 12.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.125, -137.541015625, -128.95703125, -120.373046875, -111.7890625, -103.205078125, -94.62109375, -86.037109375, -77.453125, -68.869140625, -60.28515625, -51.701171875, -43.1171875, -34.533203125, -25.94921875, -17.365234375, -8.78125, -0.197265625, 8.38671875, 16.970703125, 25.5546875, 34.138671875, 42.72265625, 51.306640625, 59.890625, 68.474609375, 77.05859375, 85.642578125, 94.2265625, 102.810546875, 111.39453125, 119.978515625, 128.5625, 137.146484375, 145.73046875, 154.314453125, 162.8984375, 171.482421875, 180.06640625, 188.650390625, 197.234375, 205.818359375, 214.40234375, 222.986328125, 231.5703125, 240.154296875, 248.73828125, 257.322265625, 265.90625, 274.490234375, 283.07421875, 291.658203125, 300.2421875, 308.826171875, 317.41015625, 325.994140625, 334.578125, 343.162109375, 351.74609375, 360.330078125, 368.9140625, 377.498046875, 386.08203125, 394.666015625, 403.25]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 8.0, 19.0, 163.0, 508.0, 239.0, 32.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.71875, -37.33056640625, -34.9423828125, -32.55419921875, -30.166015625, -27.77783203125, -25.3896484375, -23.00146484375, -20.61328125, -18.22509765625, -15.8369140625, -13.44873046875, -11.060546875, -8.67236328125, -6.2841796875, -3.89599609375, -1.5078125, 0.88037109375, 3.2685546875, 5.65673828125, 8.044921875, 10.43310546875, 12.8212890625, 15.20947265625, 17.59765625, 19.98583984375, 22.3740234375, 24.76220703125, 27.150390625, 29.53857421875, 31.9267578125, 34.31494140625, 36.703125, 39.09130859375, 41.4794921875, 43.86767578125, 46.255859375, 48.64404296875, 51.0322265625, 53.42041015625, 55.80859375, 58.19677734375, 60.5849609375, 62.97314453125, 65.361328125, 67.74951171875, 70.1376953125, 72.52587890625, 74.9140625, 77.30224609375, 79.6904296875, 82.07861328125, 84.466796875, 86.85498046875, 89.2431640625, 91.63134765625, 94.01953125, 96.40771484375, 98.7958984375, 101.18408203125, 103.572265625, 105.96044921875, 108.3486328125, 110.73681640625, 113.125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 28.0, 697.0, 268.0, 9.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3101.5537109375, -3047.957275390625, -2994.360595703125, -2940.76416015625, -2887.167724609375, -2833.571044921875, -2779.974609375, -2726.378173828125, -2672.781494140625, -2619.18505859375, -2565.58837890625, -2511.991943359375, -2458.3955078125, -2404.798828125, -2351.202392578125, -2297.60595703125, -2244.009521484375, -2190.4130859375, -2136.81640625, -2083.219970703125, -2029.6234130859375, -1976.0269775390625, -1922.430419921875, -1868.833984375, -1815.2373046875, -1761.6407470703125, -1708.0443115234375, -1654.44775390625, -1600.8511962890625, -1547.2547607421875, -1493.658203125, -1440.061767578125, -1386.46533203125, -1332.8687744140625, -1279.2723388671875, -1225.67578125, -1172.0792236328125, -1118.4827880859375, -1064.88623046875, -1011.2897338867188, -957.6931762695312, -904.0966796875, -850.5001220703125, -796.9036254882812, -743.30712890625, -689.7105712890625, -636.1140747070312, -582.517578125, -528.9210205078125, -475.3244934082031, -421.7279968261719, -368.1314697265625, -314.53497314453125, -260.9384460449219, -207.3419189453125, -153.74542236328125, -100.14892578125, -46.55241012573242, 7.044105529785156, 60.640625, 114.23713684082031, 167.83364868164062, 221.43017578125, 275.02667236328125, 328.6231994628906]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 7.0, 8.0, 13.0, 22.0, 27.0, 32.0, 40.0, 45.0, 65.0, 82.0, 76.0, 87.0, 78.0, 56.0, 67.0, 57.0, 60.0, 39.0, 42.0, 27.0, 14.0, 10.0, 12.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.6237030029297, -178.1049041748047, -172.58609008789062, -167.06729125976562, -161.54849243164062, -156.02967834472656, -150.51087951660156, -144.9920654296875, -139.4732666015625, -133.9544677734375, -128.43565368652344, -122.91685485839844, -117.3980484008789, -111.87924194335938, -106.36044311523438, -100.84163665771484, -95.32283782958984, -89.80403137207031, -84.28523254394531, -78.76642608642578, -73.24761962890625, -67.72882080078125, -62.21001434326172, -56.69120788574219, -51.17240524291992, -45.653602600097656, -40.134796142578125, -34.61599349975586, -29.09718894958496, -23.578384399414062, -18.059581756591797, -12.540775299072266, -7.02197265625, -1.5031685829162598, 4.0156354904174805, 9.534439086914062, 15.053243637084961, 20.57204818725586, 26.090850830078125, 31.609657287597656, 37.12845993041992, 42.64726257324219, 48.16606903076172, 53.684871673583984, 59.20367431640625, 64.72248077392578, 70.24128723144531, 75.76008605957031, 81.27889251708984, 86.79769897460938, 92.31649780273438, 97.8353042602539, 103.35411071777344, 108.87290954589844, 114.39171600341797, 119.9105224609375, 125.4293212890625, 130.9481201171875, 136.46693420410156, 141.98573303222656, 147.50453186035156, 153.02334594726562, 158.54214477539062, 164.06094360351562, 169.5797576904297]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 12.0, 34.0, 65.0, 87.0, 301.0, 863.0, 3489.0, 29386.0, 3956131.0, 192359.0, 8440.0, 1724.0, 631.0, 304.0, 135.0, 81.0, 73.0, 39.0, 34.0, 18.0, 20.0, 13.0, 9.0, 8.0, 10.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.78125, -55.27490234375, -51.7685546875, -48.26220703125, -44.755859375, -41.24951171875, -37.7431640625, -34.23681640625, -30.73046875, -27.22412109375, -23.7177734375, -20.21142578125, -16.705078125, -13.19873046875, -9.6923828125, -6.18603515625, -2.6796875, 0.82666015625, 4.3330078125, 7.83935546875, 11.345703125, 14.85205078125, 18.3583984375, 21.86474609375, 25.37109375, 28.87744140625, 32.3837890625, 35.89013671875, 39.396484375, 42.90283203125, 46.4091796875, 49.91552734375, 53.421875, 56.92822265625, 60.4345703125, 63.94091796875, 67.447265625, 70.95361328125, 74.4599609375, 77.96630859375, 81.47265625, 84.97900390625, 88.4853515625, 91.99169921875, 95.498046875, 99.00439453125, 102.5107421875, 106.01708984375, 109.5234375, 113.02978515625, 116.5361328125, 120.04248046875, 123.548828125, 127.05517578125, 130.5615234375, 134.06787109375, 137.57421875, 141.08056640625, 144.5869140625, 148.09326171875, 151.599609375, 155.10595703125, 158.6123046875, 162.11865234375, 165.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 13.0, 20.0, 36.0, 52.0, 68.0, 80.0, 121.0, 131.0, 155.0, 123.0, 84.0, 50.0, 27.0, 18.0, 10.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.792724609375, -3.51513671875, -3.237548828125, -2.9599609375, -2.682373046875, -2.40478515625, -2.127197265625, -1.849609375, -1.572021484375, -1.29443359375, -1.016845703125, -0.7392578125, -0.461669921875, -0.18408203125, 0.093505859375, 0.37109375, 0.648681640625, 0.92626953125, 1.203857421875, 1.4814453125, 1.759033203125, 2.03662109375, 2.314208984375, 2.591796875, 2.869384765625, 3.14697265625, 3.424560546875, 3.7021484375, 3.979736328125, 4.25732421875, 4.534912109375, 4.8125, 5.090087890625, 5.36767578125, 5.645263671875, 5.9228515625, 6.200439453125, 6.47802734375, 6.755615234375, 7.033203125, 7.310791015625, 7.58837890625, 7.865966796875, 8.1435546875, 8.421142578125, 8.69873046875, 8.976318359375, 9.25390625, 9.531494140625, 9.80908203125, 10.086669921875, 10.3642578125, 10.641845703125, 10.91943359375, 11.197021484375, 11.474609375, 11.752197265625, 12.02978515625, 12.307373046875, 12.5849609375, 12.862548828125, 13.14013671875, 13.417724609375, 13.6953125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 11.0, 14.0, 30.0, 112.0, 289.0, 893.0, 19718.0, 4168527.0, 3423.0, 719.0, 291.0, 133.0, 53.0, 29.0, 21.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-182.375, -171.822265625, -161.26953125, -150.716796875, -140.1640625, -129.611328125, -119.05859375, -108.505859375, -97.953125, -87.400390625, -76.84765625, -66.294921875, -55.7421875, -45.189453125, -34.63671875, -24.083984375, -13.53125, -2.978515625, 7.57421875, 18.126953125, 28.6796875, 39.232421875, 49.78515625, 60.337890625, 70.890625, 81.443359375, 91.99609375, 102.548828125, 113.1015625, 123.654296875, 134.20703125, 144.759765625, 155.3125, 165.865234375, 176.41796875, 186.970703125, 197.5234375, 208.076171875, 218.62890625, 229.181640625, 239.734375, 250.287109375, 260.83984375, 271.392578125, 281.9453125, 292.498046875, 303.05078125, 313.603515625, 324.15625, 334.708984375, 345.26171875, 355.814453125, 366.3671875, 376.919921875, 387.47265625, 398.025390625, 408.578125, 419.130859375, 429.68359375, 440.236328125, 450.7890625, 461.341796875, 471.89453125, 482.447265625, 493.0]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 11.0, 28.0, 46.0, 195.0, 849.0, 2485.0, 277.0, 94.0, 38.0, 18.0, 12.0, 8.0, 3.0, 5.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.3221435546875, -7.636474609375, -6.9508056640625, -6.26513671875, -5.5794677734375, -4.893798828125, -4.2081298828125, -3.5224609375, -2.8367919921875, -2.151123046875, -1.4654541015625, -0.77978515625, -0.0941162109375, 0.591552734375, 1.2772216796875, 1.962890625, 2.6485595703125, 3.334228515625, 4.0198974609375, 4.70556640625, 5.3912353515625, 6.076904296875, 6.7625732421875, 7.4482421875, 8.1339111328125, 8.819580078125, 9.5052490234375, 10.19091796875, 10.8765869140625, 11.562255859375, 12.2479248046875, 12.93359375, 13.6192626953125, 14.304931640625, 14.9906005859375, 15.67626953125, 16.3619384765625, 17.047607421875, 17.7332763671875, 18.4189453125, 19.1046142578125, 19.790283203125, 20.4759521484375, 21.16162109375, 21.8472900390625, 22.532958984375, 23.2186279296875, 23.904296875, 24.5899658203125, 25.275634765625, 25.9613037109375, 26.64697265625, 27.3326416015625, 28.018310546875, 28.7039794921875, 29.3896484375, 30.0753173828125, 30.760986328125, 31.4466552734375, 32.13232421875, 32.8179931640625, 33.503662109375, 34.1893310546875, 34.875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 12.0, 381.0, 557.0, 45.0, 8.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-802.9163208007812, -781.8193359375, -760.722412109375, -739.62548828125, -718.5285034179688, -697.4315185546875, -676.3345947265625, -655.2376708984375, -634.1406860351562, -613.043701171875, -591.94677734375, -570.849853515625, -549.7528686523438, -528.6558837890625, -507.5589599609375, -486.4620056152344, -465.36505126953125, -444.2680969238281, -423.171142578125, -402.0741882324219, -380.97723388671875, -359.8802795410156, -338.7833251953125, -317.6863708496094, -296.58941650390625, -275.4924621582031, -254.3955078125, -233.29855346679688, -212.20159912109375, -191.10464477539062, -170.0076904296875, -148.91073608398438, -127.81378173828125, -106.71682739257812, -85.619873046875, -64.52291870117188, -43.42596435546875, -22.329010009765625, -1.2320556640625, 19.864898681640625, 40.96185302734375, 62.058807373046875, 83.15576171875, 104.25271606445312, 125.34967041015625, 146.44662475585938, 167.5435791015625, 188.64053344726562, 209.73748779296875, 230.83444213867188, 251.931396484375, 273.0283508300781, 294.12530517578125, 315.2222595214844, 336.3192138671875, 357.4161682128906, 378.51312255859375, 399.6100769042969, 420.70703125, 441.8039855957031, 462.90093994140625, 483.9978942871094, 505.0948486328125, 526.1917724609375, 547.2887573242188]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 7.0, 11.0, 25.0, 25.0, 48.0, 73.0, 69.0, 96.0, 104.0, 85.0, 93.0, 86.0, 77.0, 61.0, 45.0, 31.0, 27.0, 19.0, 11.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-100.93111419677734, -97.49193572998047, -94.05274963378906, -90.61357116699219, -87.17439270019531, -83.7352066040039, -80.29602813720703, -76.85684204101562, -73.41766357421875, -69.97848510742188, -66.53929901123047, -63.100120544433594, -59.66093826293945, -56.22175598144531, -52.78257751464844, -49.3433952331543, -45.904212951660156, -42.465030670166016, -39.025848388671875, -35.586669921875, -32.14748764038086, -28.70830535888672, -25.26912498474121, -21.829944610595703, -18.390762329101562, -14.951581001281738, -11.512399673461914, -8.07321834564209, -4.634037017822266, -1.194854736328125, 2.244325637817383, 5.683506011962891, 9.122695922851562, 12.561877250671387, 16.00105857849121, 19.44023895263672, 22.87942123413086, 26.318603515625, 29.757783889770508, 33.196964263916016, 36.636146545410156, 40.0753288269043, 43.51451110839844, 46.95368957519531, 50.39287185668945, 53.832054138183594, 57.27123260498047, 60.71041488647461, 64.14959716796875, 67.58877563476562, 71.02796173095703, 74.4671401977539, 77.90632629394531, 81.34550476074219, 84.78468322753906, 88.22386169433594, 91.66304779052734, 95.10222625732422, 98.54141235351562, 101.9805908203125, 105.41976928710938, 108.85895538330078, 112.29813385009766, 115.73731994628906, 119.17649841308594]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 12.0, 12.0, 24.0, 25.0, 28.0, 50.0, 58.0, 95.0, 148.0, 204.0, 359.0, 556.0, 1332.0, 3798.0, 14745.0, 83582.0, 613394.0, 280711.0, 37122.0, 7781.0, 2302.0, 919.0, 465.0, 249.0, 170.0, 111.0, 97.0, 50.0, 31.0, 31.0, 22.0, 17.0, 10.0, 11.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.125, -69.080078125, -67.03515625, -64.990234375, -62.9453125, -60.900390625, -58.85546875, -56.810546875, -54.765625, -52.720703125, -50.67578125, -48.630859375, -46.5859375, -44.541015625, -42.49609375, -40.451171875, -38.40625, -36.361328125, -34.31640625, -32.271484375, -30.2265625, -28.181640625, -26.13671875, -24.091796875, -22.046875, -20.001953125, -17.95703125, -15.912109375, -13.8671875, -11.822265625, -9.77734375, -7.732421875, -5.6875, -3.642578125, -1.59765625, 0.447265625, 2.4921875, 4.537109375, 6.58203125, 8.626953125, 10.671875, 12.716796875, 14.76171875, 16.806640625, 18.8515625, 20.896484375, 22.94140625, 24.986328125, 27.03125, 29.076171875, 31.12109375, 33.166015625, 35.2109375, 37.255859375, 39.30078125, 41.345703125, 43.390625, 45.435546875, 47.48046875, 49.525390625, 51.5703125, 53.615234375, 55.66015625, 57.705078125, 59.75]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 8.0, 7.0, 6.0, 21.0, 32.0, 35.0, 55.0, 69.0, 90.0, 115.0, 97.0, 106.0, 98.0, 74.0, 62.0, 50.0, 29.0, 17.0, 16.0, 9.0, 6.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.87078857421875, -5.5579833984375, -5.24517822265625, -4.932373046875, -4.61956787109375, -4.3067626953125, -3.99395751953125, -3.68115234375, -3.36834716796875, -3.0555419921875, -2.74273681640625, -2.429931640625, -2.11712646484375, -1.8043212890625, -1.49151611328125, -1.1787109375, -0.86590576171875, -0.5531005859375, -0.24029541015625, 0.072509765625, 0.38531494140625, 0.6981201171875, 1.01092529296875, 1.32373046875, 1.63653564453125, 1.9493408203125, 2.26214599609375, 2.574951171875, 2.88775634765625, 3.2005615234375, 3.51336669921875, 3.826171875, 4.13897705078125, 4.4517822265625, 4.76458740234375, 5.077392578125, 5.39019775390625, 5.7030029296875, 6.01580810546875, 6.32861328125, 6.64141845703125, 6.9542236328125, 7.26702880859375, 7.579833984375, 7.89263916015625, 8.2054443359375, 8.51824951171875, 8.8310546875, 9.14385986328125, 9.4566650390625, 9.76947021484375, 10.082275390625, 10.39508056640625, 10.7078857421875, 11.02069091796875, 11.33349609375, 11.64630126953125, 11.9591064453125, 12.27191162109375, 12.584716796875, 12.89752197265625, 13.2103271484375, 13.52313232421875, 13.8359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 13.0, 5.0, 10.0, 14.0, 23.0, 38.0, 51.0, 77.0, 120.0, 186.0, 285.0, 419.0, 833.0, 1679.0, 4345.0, 14416.0, 77160.0, 586507.0, 308937.0, 38507.0, 8983.0, 2903.0, 1327.0, 662.0, 373.0, 218.0, 141.0, 87.0, 69.0, 41.0, 33.0, 30.0, 15.0, 10.0, 9.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-54.6875, -53.11669921875, -51.5458984375, -49.97509765625, -48.404296875, -46.83349609375, -45.2626953125, -43.69189453125, -42.12109375, -40.55029296875, -38.9794921875, -37.40869140625, -35.837890625, -34.26708984375, -32.6962890625, -31.12548828125, -29.5546875, -27.98388671875, -26.4130859375, -24.84228515625, -23.271484375, -21.70068359375, -20.1298828125, -18.55908203125, -16.98828125, -15.41748046875, -13.8466796875, -12.27587890625, -10.705078125, -9.13427734375, -7.5634765625, -5.99267578125, -4.421875, -2.85107421875, -1.2802734375, 0.29052734375, 1.861328125, 3.43212890625, 5.0029296875, 6.57373046875, 8.14453125, 9.71533203125, 11.2861328125, 12.85693359375, 14.427734375, 15.99853515625, 17.5693359375, 19.14013671875, 20.7109375, 22.28173828125, 23.8525390625, 25.42333984375, 26.994140625, 28.56494140625, 30.1357421875, 31.70654296875, 33.27734375, 34.84814453125, 36.4189453125, 37.98974609375, 39.560546875, 41.13134765625, 42.7021484375, 44.27294921875, 45.84375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 12.0, 10.0, 7.0, 12.0, 32.0, 30.0, 30.0, 27.0, 37.0, 51.0, 38.0, 46.0, 42.0, 55.0, 51.0, 67.0, 46.0, 50.0, 52.0, 60.0, 45.0, 35.0, 30.0, 15.0, 19.0, 19.0, 13.0, 19.0, 12.0, 11.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.515625, -26.78759765625, -26.0595703125, -25.33154296875, -24.603515625, -23.87548828125, -23.1474609375, -22.41943359375, -21.69140625, -20.96337890625, -20.2353515625, -19.50732421875, -18.779296875, -18.05126953125, -17.3232421875, -16.59521484375, -15.8671875, -15.13916015625, -14.4111328125, -13.68310546875, -12.955078125, -12.22705078125, -11.4990234375, -10.77099609375, -10.04296875, -9.31494140625, -8.5869140625, -7.85888671875, -7.130859375, -6.40283203125, -5.6748046875, -4.94677734375, -4.21875, -3.49072265625, -2.7626953125, -2.03466796875, -1.306640625, -0.57861328125, 0.1494140625, 0.87744140625, 1.60546875, 2.33349609375, 3.0615234375, 3.78955078125, 4.517578125, 5.24560546875, 5.9736328125, 6.70166015625, 7.4296875, 8.15771484375, 8.8857421875, 9.61376953125, 10.341796875, 11.06982421875, 11.7978515625, 12.52587890625, 13.25390625, 13.98193359375, 14.7099609375, 15.43798828125, 16.166015625, 16.89404296875, 17.6220703125, 18.35009765625, 19.078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 3.0, 4.0, 6.0, 8.0, 15.0, 21.0, 28.0, 33.0, 53.0, 88.0, 135.0, 250.0, 449.0, 896.0, 1870.0, 4802.0, 14358.0, 56511.0, 367654.0, 496004.0, 76971.0, 18070.0, 5825.0, 2264.0, 1051.0, 460.0, 243.0, 160.0, 96.0, 62.0, 49.0, 29.0, 21.0, 17.0, 7.0, 4.0, 9.0, 5.0, 1.0, 6.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.625, -18.044677734375, -17.46435546875, -16.884033203125, -16.3037109375, -15.723388671875, -15.14306640625, -14.562744140625, -13.982421875, -13.402099609375, -12.82177734375, -12.241455078125, -11.6611328125, -11.080810546875, -10.50048828125, -9.920166015625, -9.33984375, -8.759521484375, -8.17919921875, -7.598876953125, -7.0185546875, -6.438232421875, -5.85791015625, -5.277587890625, -4.697265625, -4.116943359375, -3.53662109375, -2.956298828125, -2.3759765625, -1.795654296875, -1.21533203125, -0.635009765625, -0.0546875, 0.525634765625, 1.10595703125, 1.686279296875, 2.2666015625, 2.846923828125, 3.42724609375, 4.007568359375, 4.587890625, 5.168212890625, 5.74853515625, 6.328857421875, 6.9091796875, 7.489501953125, 8.06982421875, 8.650146484375, 9.23046875, 9.810791015625, 10.39111328125, 10.971435546875, 11.5517578125, 12.132080078125, 12.71240234375, 13.292724609375, 13.873046875, 14.453369140625, 15.03369140625, 15.614013671875, 16.1943359375, 16.774658203125, 17.35498046875, 17.935302734375, 18.515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 8.0, 3.0, 8.0, 9.0, 9.0, 15.0, 29.0, 30.0, 29.0, 60.0, 71.0, 83.0, 124.0, 81.0, 98.0, 74.0, 68.0, 51.0, 34.0, 35.0, 24.0, 14.0, 7.0, 12.0, 5.0, 6.0, 2.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00232696533203125, -0.002238750457763672, -0.0021505355834960938, -0.0020623207092285156, -0.0019741058349609375, -0.0018858909606933594, -0.0017976760864257812, -0.0017094612121582031, -0.001621246337890625, -0.0015330314636230469, -0.0014448165893554688, -0.0013566017150878906, -0.0012683868408203125, -0.0011801719665527344, -0.0010919570922851562, -0.0010037422180175781, -0.00091552734375, -0.0008273124694824219, -0.0007390975952148438, -0.0006508827209472656, -0.0005626678466796875, -0.0004744529724121094, -0.00038623809814453125, -0.0002980232238769531, -0.000209808349609375, -0.00012159347534179688, -3.337860107421875e-05, 5.4836273193359375e-05, 0.0001430511474609375, 0.00023126602172851562, 0.00031948089599609375, 0.0004076957702636719, 0.00049591064453125, 0.0005841255187988281, 0.0006723403930664062, 0.0007605552673339844, 0.0008487701416015625, 0.0009369850158691406, 0.0010251998901367188, 0.0011134147644042969, 0.001201629638671875, 0.0012898445129394531, 0.0013780593872070312, 0.0014662742614746094, 0.0015544891357421875, 0.0016427040100097656, 0.0017309188842773438, 0.0018191337585449219, 0.0019073486328125, 0.001995563507080078, 0.0020837783813476562, 0.0021719932556152344, 0.0022602081298828125, 0.0023484230041503906, 0.0024366378784179688, 0.002524852752685547, 0.002613067626953125, 0.002701282501220703, 0.0027894973754882812, 0.0028777122497558594, 0.0029659271240234375, 0.0030541419982910156, 0.0031423568725585938, 0.003230571746826172, 0.00331878662109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 7.0, 9.0, 14.0, 21.0, 21.0, 38.0, 55.0, 65.0, 99.0, 193.0, 298.0, 505.0, 1096.0, 2404.0, 6952.0, 26421.0, 216783.0, 689413.0, 81328.0, 14715.0, 4466.0, 1680.0, 830.0, 436.0, 243.0, 133.0, 100.0, 67.0, 44.0, 28.0, 16.0, 14.0, 10.0, 4.0, 7.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.609375, -19.950927734375, -19.29248046875, -18.634033203125, -17.9755859375, -17.317138671875, -16.65869140625, -16.000244140625, -15.341796875, -14.683349609375, -14.02490234375, -13.366455078125, -12.7080078125, -12.049560546875, -11.39111328125, -10.732666015625, -10.07421875, -9.415771484375, -8.75732421875, -8.098876953125, -7.4404296875, -6.781982421875, -6.12353515625, -5.465087890625, -4.806640625, -4.148193359375, -3.48974609375, -2.831298828125, -2.1728515625, -1.514404296875, -0.85595703125, -0.197509765625, 0.4609375, 1.119384765625, 1.77783203125, 2.436279296875, 3.0947265625, 3.753173828125, 4.41162109375, 5.070068359375, 5.728515625, 6.386962890625, 7.04541015625, 7.703857421875, 8.3623046875, 9.020751953125, 9.67919921875, 10.337646484375, 10.99609375, 11.654541015625, 12.31298828125, 12.971435546875, 13.6298828125, 14.288330078125, 14.94677734375, 15.605224609375, 16.263671875, 16.922119140625, 17.58056640625, 18.239013671875, 18.8974609375, 19.555908203125, 20.21435546875, 20.872802734375, 21.53125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 3.0, 6.0, 8.0, 10.0, 10.0, 19.0, 20.0, 25.0, 31.0, 36.0, 55.0, 48.0, 68.0, 85.0, 76.0, 85.0, 98.0, 54.0, 62.0, 31.0, 33.0, 25.0, 11.0, 18.0, 18.0, 8.0, 10.0, 8.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.21875, -7.924560546875, -7.63037109375, -7.336181640625, -7.0419921875, -6.747802734375, -6.45361328125, -6.159423828125, -5.865234375, -5.571044921875, -5.27685546875, -4.982666015625, -4.6884765625, -4.394287109375, -4.10009765625, -3.805908203125, -3.51171875, -3.217529296875, -2.92333984375, -2.629150390625, -2.3349609375, -2.040771484375, -1.74658203125, -1.452392578125, -1.158203125, -0.864013671875, -0.56982421875, -0.275634765625, 0.0185546875, 0.312744140625, 0.60693359375, 0.901123046875, 1.1953125, 1.489501953125, 1.78369140625, 2.077880859375, 2.3720703125, 2.666259765625, 2.96044921875, 3.254638671875, 3.548828125, 3.843017578125, 4.13720703125, 4.431396484375, 4.7255859375, 5.019775390625, 5.31396484375, 5.608154296875, 5.90234375, 6.196533203125, 6.49072265625, 6.784912109375, 7.0791015625, 7.373291015625, 7.66748046875, 7.961669921875, 8.255859375, 8.550048828125, 8.84423828125, 9.138427734375, 9.4326171875, 9.726806640625, 10.02099609375, 10.315185546875, 10.609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 21.0, 116.0, 307.0, 362.0, 125.0, 35.0, 10.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-608.5933837890625, -593.8239135742188, -579.0543823242188, -564.284912109375, -549.5154418945312, -534.7459106445312, -519.9764404296875, -505.2069396972656, -490.43743896484375, -475.6679382324219, -460.8984680175781, -446.12896728515625, -431.3594665527344, -416.5899658203125, -401.82049560546875, -387.0509948730469, -372.2815246582031, -357.51202392578125, -342.7425537109375, -327.9730529785156, -313.20355224609375, -298.43408203125, -283.6645812988281, -268.89508056640625, -254.12559509277344, -239.35610961914062, -224.58660888671875, -209.81712341308594, -195.04763793945312, -180.27813720703125, -165.50865173339844, -150.73916625976562, -135.96963500976562, -121.20014190673828, -106.43064880371094, -91.66116333007812, -76.89167022705078, -62.12217712402344, -47.352691650390625, -32.58319854736328, -17.813705444335938, -3.0442142486572266, 11.725276947021484, 26.494766235351562, 41.264259338378906, 56.03375244140625, 70.80323791503906, 85.5727310180664, 100.34222412109375, 115.1117172241211, 129.88121032714844, 144.65069580078125, 159.42019653320312, 174.18968200683594, 188.95916748046875, 203.72866821289062, 218.49815368652344, 233.26763916015625, 248.03713989257812, 262.806640625, 277.57611083984375, 292.3456115722656, 307.1151123046875, 321.88458251953125, 336.6540832519531]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 3.0, 4.0, 6.0, 6.0, 9.0, 20.0, 10.0, 22.0, 24.0, 37.0, 31.0, 44.0, 35.0, 44.0, 56.0, 51.0, 76.0, 57.0, 69.0, 50.0, 59.0, 60.0, 39.0, 35.0, 29.0, 30.0, 28.0, 21.0, 8.0, 10.0, 10.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.98085021972656, -113.7710189819336, -109.56118774414062, -105.35135650634766, -101.14152526855469, -96.93169403076172, -92.72186279296875, -88.51202392578125, -84.30220031738281, -80.09236907958984, -75.88253784179688, -71.6727066040039, -67.46287536621094, -63.25304412841797, -59.043209075927734, -54.833377838134766, -50.62354278564453, -46.41371154785156, -42.203880310058594, -37.994049072265625, -33.784217834472656, -29.574384689331055, -25.364551544189453, -21.154720306396484, -16.944889068603516, -12.735057830810547, -8.525225639343262, -4.315393447875977, -0.10556221008300781, 4.104269027709961, 8.314102172851562, 12.523933410644531, 16.7337646484375, 20.94359588623047, 25.153427124023438, 29.36326026916504, 33.573089599609375, 37.782920837402344, 41.99275588989258, 46.20258712768555, 50.412418365478516, 54.622249603271484, 58.83208084106445, 63.04191589355469, 67.25174713134766, 71.46157836914062, 75.6714096069336, 79.88124084472656, 84.09107208251953, 88.3009033203125, 92.51073455810547, 96.72056579589844, 100.9303970336914, 105.14022827148438, 109.35006713867188, 113.55989074707031, 117.76972961425781, 121.97956085205078, 126.18939208984375, 130.39923095703125, 134.6090545654297, 138.8188934326172, 143.02871704101562, 147.23855590820312, 151.44837951660156]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 6.0, 12.0, 20.0, 35.0, 38.0, 131.0, 300.0, 967.0, 5771.0, 93741.0, 4055978.0, 32269.0, 3288.0, 885.0, 365.0, 194.0, 105.0, 74.0, 38.0, 19.0, 16.0, 8.0, 4.0, 11.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.75, -57.25, -53.75, -50.25, -46.75, -43.25, -39.75, -36.25, -32.75, -29.25, -25.75, -22.25, -18.75, -15.25, -11.75, -8.25, -4.75, -1.25, 2.25, 5.75, 9.25, 12.75, 16.25, 19.75, 23.25, 26.75, 30.25, 33.75, 37.25, 40.75, 44.25, 47.75, 51.25, 54.75, 58.25, 61.75, 65.25, 68.75, 72.25, 75.75, 79.25, 82.75, 86.25, 89.75, 93.25, 96.75, 100.25, 103.75, 107.25, 110.75, 114.25, 117.75, 121.25, 124.75, 128.25, 131.75, 135.25, 138.75, 142.25, 145.75, 149.25, 152.75, 156.25, 159.75, 163.25]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 10.0, 12.0, 21.0, 24.0, 34.0, 49.0, 77.0, 86.0, 98.0, 108.0, 99.0, 102.0, 71.0, 72.0, 44.0, 29.0, 27.0, 15.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.734375, -5.4296875, -5.125, -4.8203125, -4.515625, -4.2109375, -3.90625, -3.6015625, -3.296875, -2.9921875, -2.6875, -2.3828125, -2.078125, -1.7734375, -1.46875, -1.1640625, -0.859375, -0.5546875, -0.25, 0.0546875, 0.359375, 0.6640625, 0.96875, 1.2734375, 1.578125, 1.8828125, 2.1875, 2.4921875, 2.796875, 3.1015625, 3.40625, 3.7109375, 4.015625, 4.3203125, 4.625, 4.9296875, 5.234375, 5.5390625, 5.84375, 6.1484375, 6.453125, 6.7578125, 7.0625, 7.3671875, 7.671875, 7.9765625, 8.28125, 8.5859375, 8.890625, 9.1953125, 9.5, 9.8046875, 10.109375, 10.4140625, 10.71875, 11.0234375, 11.328125, 11.6328125, 11.9375, 12.2421875, 12.546875, 12.8515625, 13.15625, 13.4609375, 13.765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 13.0, 14.0, 24.0, 26.0, 40.0, 71.0, 82.0, 168.0, 526.0, 4084063.0, 108506.0, 431.0, 156.0, 63.0, 41.0, 28.0, 17.0, 10.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-631.5, -615.68359375, -599.8671875, -584.05078125, -568.234375, -552.41796875, -536.6015625, -520.78515625, -504.96875, -489.15234375, -473.3359375, -457.51953125, -441.703125, -425.88671875, -410.0703125, -394.25390625, -378.4375, -362.62109375, -346.8046875, -330.98828125, -315.171875, -299.35546875, -283.5390625, -267.72265625, -251.90625, -236.08984375, -220.2734375, -204.45703125, -188.640625, -172.82421875, -157.0078125, -141.19140625, -125.375, -109.55859375, -93.7421875, -77.92578125, -62.109375, -46.29296875, -30.4765625, -14.66015625, 1.15625, 16.97265625, 32.7890625, 48.60546875, 64.421875, 80.23828125, 96.0546875, 111.87109375, 127.6875, 143.50390625, 159.3203125, 175.13671875, 190.953125, 206.76953125, 222.5859375, 238.40234375, 254.21875, 270.03515625, 285.8515625, 301.66796875, 317.484375, 333.30078125, 349.1171875, 364.93359375, 380.75]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 13.0, 63.0, 1419.0, 2488.0, 83.0, 15.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.5, -90.613037109375, -88.72607421875, -86.839111328125, -84.9521484375, -83.065185546875, -81.17822265625, -79.291259765625, -77.404296875, -75.517333984375, -73.63037109375, -71.743408203125, -69.8564453125, -67.969482421875, -66.08251953125, -64.195556640625, -62.30859375, -60.421630859375, -58.53466796875, -56.647705078125, -54.7607421875, -52.873779296875, -50.98681640625, -49.099853515625, -47.212890625, -45.325927734375, -43.43896484375, -41.552001953125, -39.6650390625, -37.778076171875, -35.89111328125, -34.004150390625, -32.1171875, -30.230224609375, -28.34326171875, -26.456298828125, -24.5693359375, -22.682373046875, -20.79541015625, -18.908447265625, -17.021484375, -15.134521484375, -13.24755859375, -11.360595703125, -9.4736328125, -7.586669921875, -5.69970703125, -3.812744140625, -1.92578125, -0.038818359375, 1.84814453125, 3.735107421875, 5.6220703125, 7.509033203125, 9.39599609375, 11.282958984375, 13.169921875, 15.056884765625, 16.94384765625, 18.830810546875, 20.7177734375, 22.604736328125, 24.49169921875, 26.378662109375, 28.265625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 75.0, 908.0, 19.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-679.7140502929688, -650.5458984375, -621.377685546875, -592.2095336914062, -563.0413818359375, -533.8732299804688, -504.7050476074219, -475.536865234375, -446.36871337890625, -417.2005615234375, -388.0323791503906, -358.86419677734375, -329.696044921875, -300.52789306640625, -271.3597106933594, -242.19154357910156, -213.02337646484375, -183.85520935058594, -154.68704223632812, -125.51887512207031, -96.3507080078125, -67.18254089355469, -38.014373779296875, -8.846206665039062, 20.32196044921875, 49.49012756347656, 78.65829467773438, 107.82646179199219, 136.99462890625, 166.1627960205078, 195.33096313476562, 224.49913024902344, 253.6673583984375, 282.83551025390625, 312.0036926269531, 341.171875, 370.34002685546875, 399.5081787109375, 428.6763610839844, 457.84454345703125, 487.0126953125, 516.1808471679688, 545.3489990234375, 574.5172119140625, 603.6853637695312, 632.853515625, 662.021728515625, 691.1898803710938, 720.3580322265625, 749.5261840820312, 778.6943359375, 807.862548828125, 837.0307006835938, 866.1988525390625, 895.3670654296875, 924.5352172851562, 953.703369140625, 982.8715209960938, 1012.0396728515625, 1041.2078857421875, 1070.3759765625, 1099.544189453125, 1128.71240234375, 1157.8804931640625, 1187.0487060546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 16.0, 35.0, 78.0, 98.0, 120.0, 153.0, 133.0, 125.0, 98.0, 68.0, 42.0, 19.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-107.30892181396484, -103.36298370361328, -99.41704559326172, -95.47110748291016, -91.5251693725586, -87.57923126220703, -83.63328552246094, -79.68734741210938, -75.74140930175781, -71.79547119140625, -67.84953308105469, -63.903594970703125, -59.95765686035156, -56.01171875, -52.06577682495117, -48.11983871459961, -44.17390441894531, -40.22796630859375, -36.28202819824219, -32.336090087890625, -28.39015007019043, -24.444211959838867, -20.498271942138672, -16.55233383178711, -12.606395721435547, -8.660457611083984, -4.7145185470581055, -0.7685794830322266, 3.177358627319336, 7.123296737670898, 11.069236755371094, 15.015174865722656, 18.961105346679688, 22.90704345703125, 26.852981567382812, 30.798921585083008, 34.74485778808594, 38.6907958984375, 42.63673782348633, 46.58267593383789, 50.52861404418945, 54.474552154541016, 58.42049026489258, 62.366432189941406, 66.31237030029297, 70.25830841064453, 74.2042465209961, 78.15018463134766, 82.09612274169922, 86.04206085205078, 89.98799896240234, 93.9339370727539, 97.87987518310547, 101.82581329345703, 105.77175903320312, 109.71769714355469, 113.66363525390625, 117.60957336425781, 121.55551147460938, 125.50144958496094, 129.4473876953125, 133.39332580566406, 137.33926391601562, 141.2852020263672, 145.23114013671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 7.0, 12.0, 14.0, 16.0, 19.0, 30.0, 54.0, 43.0, 70.0, 95.0, 174.0, 216.0, 407.0, 644.0, 1188.0, 2392.0, 4981.0, 12026.0, 31395.0, 100258.0, 341242.0, 376899.0, 116214.0, 35913.0, 13014.0, 5460.0, 2600.0, 1253.0, 689.0, 383.0, 255.0, 152.0, 95.0, 81.0, 64.0, 44.0, 39.0, 28.0, 18.0, 13.0, 12.0, 6.0, 10.0, 6.0, 5.0, 3.0, 2.0, 8.0], "bins": [-36.75, -35.75830078125, -34.7666015625, -33.77490234375, -32.783203125, -31.79150390625, -30.7998046875, -29.80810546875, -28.81640625, -27.82470703125, -26.8330078125, -25.84130859375, -24.849609375, -23.85791015625, -22.8662109375, -21.87451171875, -20.8828125, -19.89111328125, -18.8994140625, -17.90771484375, -16.916015625, -15.92431640625, -14.9326171875, -13.94091796875, -12.94921875, -11.95751953125, -10.9658203125, -9.97412109375, -8.982421875, -7.99072265625, -6.9990234375, -6.00732421875, -5.015625, -4.02392578125, -3.0322265625, -2.04052734375, -1.048828125, -0.05712890625, 0.9345703125, 1.92626953125, 2.91796875, 3.90966796875, 4.9013671875, 5.89306640625, 6.884765625, 7.87646484375, 8.8681640625, 9.85986328125, 10.8515625, 11.84326171875, 12.8349609375, 13.82666015625, 14.818359375, 15.81005859375, 16.8017578125, 17.79345703125, 18.78515625, 19.77685546875, 20.7685546875, 21.76025390625, 22.751953125, 23.74365234375, 24.7353515625, 25.72705078125, 26.71875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 5.0, 17.0, 22.0, 32.0, 34.0, 33.0, 49.0, 63.0, 72.0, 81.0, 82.0, 88.0, 87.0, 66.0, 53.0, 47.0, 36.0, 42.0, 26.0, 13.0, 10.0, 18.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.0931396484375, -5.858154296875, -5.6231689453125, -5.38818359375, -5.1531982421875, -4.918212890625, -4.6832275390625, -4.4482421875, -4.2132568359375, -3.978271484375, -3.7432861328125, -3.50830078125, -3.2733154296875, -3.038330078125, -2.8033447265625, -2.568359375, -2.3333740234375, -2.098388671875, -1.8634033203125, -1.62841796875, -1.3934326171875, -1.158447265625, -0.9234619140625, -0.6884765625, -0.4534912109375, -0.218505859375, 0.0164794921875, 0.25146484375, 0.4864501953125, 0.721435546875, 0.9564208984375, 1.19140625, 1.4263916015625, 1.661376953125, 1.8963623046875, 2.13134765625, 2.3663330078125, 2.601318359375, 2.8363037109375, 3.0712890625, 3.3062744140625, 3.541259765625, 3.7762451171875, 4.01123046875, 4.2462158203125, 4.481201171875, 4.7161865234375, 4.951171875, 5.1861572265625, 5.421142578125, 5.6561279296875, 5.89111328125, 6.1260986328125, 6.361083984375, 6.5960693359375, 6.8310546875, 7.0660400390625, 7.301025390625, 7.5360107421875, 7.77099609375, 8.0059814453125, 8.240966796875, 8.4759521484375, 8.7109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 3.0, 9.0, 9.0, 8.0, 14.0, 21.0, 30.0, 34.0, 52.0, 77.0, 114.0, 137.0, 243.0, 340.0, 546.0, 1006.0, 2031.0, 4667.0, 14164.0, 60415.0, 387537.0, 474375.0, 75773.0, 16514.0, 5352.0, 2186.0, 1142.0, 580.0, 394.0, 216.0, 148.0, 105.0, 87.0, 65.0, 41.0, 32.0, 26.0, 11.0, 11.0, 13.0, 7.0, 1.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.78125, -40.3916015625, -39.001953125, -37.6123046875, -36.22265625, -34.8330078125, -33.443359375, -32.0537109375, -30.6640625, -29.2744140625, -27.884765625, -26.4951171875, -25.10546875, -23.7158203125, -22.326171875, -20.9365234375, -19.546875, -18.1572265625, -16.767578125, -15.3779296875, -13.98828125, -12.5986328125, -11.208984375, -9.8193359375, -8.4296875, -7.0400390625, -5.650390625, -4.2607421875, -2.87109375, -1.4814453125, -0.091796875, 1.2978515625, 2.6875, 4.0771484375, 5.466796875, 6.8564453125, 8.24609375, 9.6357421875, 11.025390625, 12.4150390625, 13.8046875, 15.1943359375, 16.583984375, 17.9736328125, 19.36328125, 20.7529296875, 22.142578125, 23.5322265625, 24.921875, 26.3115234375, 27.701171875, 29.0908203125, 30.48046875, 31.8701171875, 33.259765625, 34.6494140625, 36.0390625, 37.4287109375, 38.818359375, 40.2080078125, 41.59765625, 42.9873046875, 44.376953125, 45.7666015625, 47.15625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 3.0, 3.0, 8.0, 8.0, 8.0, 11.0, 16.0, 18.0, 25.0, 19.0, 31.0, 41.0, 33.0, 36.0, 56.0, 44.0, 63.0, 46.0, 43.0, 49.0, 64.0, 28.0, 42.0, 46.0, 40.0, 36.0, 20.0, 25.0, 29.0, 15.0, 13.0, 15.0, 12.0, 10.0, 9.0, 10.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.640625, -19.92333984375, -19.2060546875, -18.48876953125, -17.771484375, -17.05419921875, -16.3369140625, -15.61962890625, -14.90234375, -14.18505859375, -13.4677734375, -12.75048828125, -12.033203125, -11.31591796875, -10.5986328125, -9.88134765625, -9.1640625, -8.44677734375, -7.7294921875, -7.01220703125, -6.294921875, -5.57763671875, -4.8603515625, -4.14306640625, -3.42578125, -2.70849609375, -1.9912109375, -1.27392578125, -0.556640625, 0.16064453125, 0.8779296875, 1.59521484375, 2.3125, 3.02978515625, 3.7470703125, 4.46435546875, 5.181640625, 5.89892578125, 6.6162109375, 7.33349609375, 8.05078125, 8.76806640625, 9.4853515625, 10.20263671875, 10.919921875, 11.63720703125, 12.3544921875, 13.07177734375, 13.7890625, 14.50634765625, 15.2236328125, 15.94091796875, 16.658203125, 17.37548828125, 18.0927734375, 18.81005859375, 19.52734375, 20.24462890625, 20.9619140625, 21.67919921875, 22.396484375, 23.11376953125, 23.8310546875, 24.54833984375, 25.265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 18.0, 25.0, 48.0, 51.0, 132.0, 290.0, 847.0, 4450.0, 81146.0, 938023.0, 20348.0, 2188.0, 547.0, 207.0, 99.0, 47.0, 31.0, 18.0, 17.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.1875, -63.169921875, -61.15234375, -59.134765625, -57.1171875, -55.099609375, -53.08203125, -51.064453125, -49.046875, -47.029296875, -45.01171875, -42.994140625, -40.9765625, -38.958984375, -36.94140625, -34.923828125, -32.90625, -30.888671875, -28.87109375, -26.853515625, -24.8359375, -22.818359375, -20.80078125, -18.783203125, -16.765625, -14.748046875, -12.73046875, -10.712890625, -8.6953125, -6.677734375, -4.66015625, -2.642578125, -0.625, 1.392578125, 3.41015625, 5.427734375, 7.4453125, 9.462890625, 11.48046875, 13.498046875, 15.515625, 17.533203125, 19.55078125, 21.568359375, 23.5859375, 25.603515625, 27.62109375, 29.638671875, 31.65625, 33.673828125, 35.69140625, 37.708984375, 39.7265625, 41.744140625, 43.76171875, 45.779296875, 47.796875, 49.814453125, 51.83203125, 53.849609375, 55.8671875, 57.884765625, 59.90234375, 61.919921875, 63.9375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 9.0, 10.0, 14.0, 16.0, 21.0, 33.0, 40.0, 63.0, 86.0, 101.0, 120.0, 118.0, 106.0, 58.0, 48.0, 36.0, 24.0, 13.0, 20.0, 11.0, 8.0, 8.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.00421065092086792, -0.004099249839782715, -0.00398784875869751, -0.0038764476776123047, -0.0037650465965270996, -0.0036536455154418945, -0.0035422444343566895, -0.0034308433532714844, -0.0033194422721862793, -0.0032080411911010742, -0.003096640110015869, -0.002985239028930664, -0.002873837947845459, -0.002762436866760254, -0.002651035785675049, -0.0025396347045898438, -0.0024282336235046387, -0.0023168325424194336, -0.0022054314613342285, -0.0020940303802490234, -0.0019826292991638184, -0.0018712282180786133, -0.0017598271369934082, -0.0016484260559082031, -0.001537024974822998, -0.001425623893737793, -0.0013142228126525879, -0.0012028217315673828, -0.0010914206504821777, -0.0009800195693969727, -0.0008686184883117676, -0.0007572174072265625, -0.0006458163261413574, -0.0005344152450561523, -0.00042301416397094727, -0.0003116130828857422, -0.0002002120018005371, -8.881092071533203e-05, 2.2590160369873047e-05, 0.00013399124145507812, 0.0002453923225402832, 0.0003567934036254883, 0.00046819448471069336, 0.0005795955657958984, 0.0006909966468811035, 0.0008023977279663086, 0.0009137988090515137, 0.0010251998901367188, 0.0011366009712219238, 0.001248002052307129, 0.001359403133392334, 0.001470804214477539, 0.0015822052955627441, 0.0016936063766479492, 0.0018050074577331543, 0.0019164085388183594, 0.0020278096199035645, 0.0021392107009887695, 0.0022506117820739746, 0.0023620128631591797, 0.0024734139442443848, 0.00258481502532959, 0.002696216106414795, 0.0028076171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 9.0, 8.0, 21.0, 24.0, 24.0, 50.0, 86.0, 157.0, 370.0, 1098.0, 4885.0, 83748.0, 932720.0, 21332.0, 2697.0, 733.0, 248.0, 142.0, 71.0, 44.0, 25.0, 22.0, 6.0, 7.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.0625, -36.66943359375, -35.2763671875, -33.88330078125, -32.490234375, -31.09716796875, -29.7041015625, -28.31103515625, -26.91796875, -25.52490234375, -24.1318359375, -22.73876953125, -21.345703125, -19.95263671875, -18.5595703125, -17.16650390625, -15.7734375, -14.38037109375, -12.9873046875, -11.59423828125, -10.201171875, -8.80810546875, -7.4150390625, -6.02197265625, -4.62890625, -3.23583984375, -1.8427734375, -0.44970703125, 0.943359375, 2.33642578125, 3.7294921875, 5.12255859375, 6.515625, 7.90869140625, 9.3017578125, 10.69482421875, 12.087890625, 13.48095703125, 14.8740234375, 16.26708984375, 17.66015625, 19.05322265625, 20.4462890625, 21.83935546875, 23.232421875, 24.62548828125, 26.0185546875, 27.41162109375, 28.8046875, 30.19775390625, 31.5908203125, 32.98388671875, 34.376953125, 35.77001953125, 37.1630859375, 38.55615234375, 39.94921875, 41.34228515625, 42.7353515625, 44.12841796875, 45.521484375, 46.91455078125, 48.3076171875, 49.70068359375, 51.09375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 25.0, 38.0, 76.0, 134.0, 209.0, 199.0, 132.0, 63.0, 51.0, 20.0, 9.0, 8.0, 5.0, 4.0, 1.0, 1.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.16259765625, -17.3720703125, -16.58154296875, -15.791015625, -15.00048828125, -14.2099609375, -13.41943359375, -12.62890625, -11.83837890625, -11.0478515625, -10.25732421875, -9.466796875, -8.67626953125, -7.8857421875, -7.09521484375, -6.3046875, -5.51416015625, -4.7236328125, -3.93310546875, -3.142578125, -2.35205078125, -1.5615234375, -0.77099609375, 0.01953125, 0.81005859375, 1.6005859375, 2.39111328125, 3.181640625, 3.97216796875, 4.7626953125, 5.55322265625, 6.34375, 7.13427734375, 7.9248046875, 8.71533203125, 9.505859375, 10.29638671875, 11.0869140625, 11.87744140625, 12.66796875, 13.45849609375, 14.2490234375, 15.03955078125, 15.830078125, 16.62060546875, 17.4111328125, 18.20166015625, 18.9921875, 19.78271484375, 20.5732421875, 21.36376953125, 22.154296875, 22.94482421875, 23.7353515625, 24.52587890625, 25.31640625, 26.10693359375, 26.8974609375, 27.68798828125, 28.478515625, 29.26904296875, 30.0595703125, 30.85009765625, 31.640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 14.0, 19.0, 57.0, 150.0, 263.0, 237.0, 146.0, 57.0, 29.0, 16.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-412.82196044921875, -400.672119140625, -388.5223083496094, -376.3724670410156, -364.22265625, -352.07281494140625, -339.9229736328125, -327.7731628417969, -315.6233215332031, -303.4734802246094, -291.32366943359375, -279.173828125, -267.0240173339844, -254.87417602539062, -242.72434997558594, -230.57452392578125, -218.42469787597656, -206.27487182617188, -194.1250457763672, -181.9752197265625, -169.82537841796875, -157.67555236816406, -145.52572631835938, -133.37588500976562, -121.22606658935547, -109.07624053955078, -96.92640686035156, -84.77658081054688, -72.62675476074219, -60.47692108154297, -48.32709503173828, -36.17726135253906, -24.027435302734375, -11.877606391906738, 0.27222251892089844, 12.422050476074219, 24.571880340576172, 36.721710205078125, 48.87153625488281, 61.02136993408203, 73.17119598388672, 85.3210220336914, 97.47085571289062, 109.62068176269531, 121.7705078125, 133.92034912109375, 146.07015991210938, 158.22000122070312, 170.3698272705078, 182.5196533203125, 194.6694793701172, 206.81930541992188, 218.96914672851562, 231.1189727783203, 243.268798828125, 255.41864013671875, 267.5684509277344, 279.7182922363281, 291.86810302734375, 304.0179443359375, 316.1677551269531, 328.3175964355469, 340.4674072265625, 352.61724853515625, 364.76708984375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 9.0, 9.0, 14.0, 12.0, 12.0, 22.0, 21.0, 29.0, 28.0, 30.0, 39.0, 38.0, 43.0, 46.0, 48.0, 54.0, 46.0, 53.0, 47.0, 40.0, 37.0, 53.0, 45.0, 45.0, 30.0, 33.0, 18.0, 17.0, 15.0, 21.0, 13.0, 9.0, 7.0, 2.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-159.503173828125, -155.18508911132812, -150.86700439453125, -146.54891967773438, -142.2308349609375, -137.91275024414062, -133.59466552734375, -129.2765655517578, -124.95848083496094, -120.64039611816406, -116.32231140136719, -112.00422668457031, -107.6861343383789, -103.36804962158203, -99.04996490478516, -94.73188018798828, -90.4137954711914, -86.09571075439453, -81.77762603759766, -77.45953369140625, -73.14144897460938, -68.8233642578125, -64.50527954101562, -60.18719482421875, -55.86910629272461, -51.551021575927734, -47.232933044433594, -42.91484832763672, -38.596763610839844, -34.2786750793457, -29.960590362548828, -25.64250373840332, -21.324417114257812, -17.006330490112305, -12.688244819641113, -8.370159149169922, -4.052072525024414, 0.26601409912109375, 4.584098815917969, 8.902185440063477, 13.220272064208984, 17.538358688354492, 21.8564453125, 26.174530029296875, 30.492616653442383, 34.81070327758789, 39.128787994384766, 43.446876525878906, 47.76496124267578, 52.083045959472656, 56.4011344909668, 60.71921920776367, 65.03730773925781, 69.35539245605469, 73.67347717285156, 77.99156188964844, 82.30964660644531, 86.62773132324219, 90.94581604003906, 95.26390075683594, 99.58199310302734, 103.90007781982422, 108.2181625366211, 112.53624725341797, 116.85433959960938]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 18.0, 17.0, 30.0, 81.0, 105.0, 178.0, 289.0, 624.0, 1303.0, 2799.0, 7230.0, 21786.0, 89454.0, 2588881.0, 1368237.0, 81123.0, 19753.0, 6725.0, 2696.0, 1193.0, 675.0, 379.0, 229.0, 126.0, 101.0, 68.0, 58.0, 30.0, 21.0, 19.0, 12.0, 7.0, 8.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.3125, -32.88134765625, -31.4501953125, -30.01904296875, -28.587890625, -27.15673828125, -25.7255859375, -24.29443359375, -22.86328125, -21.43212890625, -20.0009765625, -18.56982421875, -17.138671875, -15.70751953125, -14.2763671875, -12.84521484375, -11.4140625, -9.98291015625, -8.5517578125, -7.12060546875, -5.689453125, -4.25830078125, -2.8271484375, -1.39599609375, 0.03515625, 1.46630859375, 2.8974609375, 4.32861328125, 5.759765625, 7.19091796875, 8.6220703125, 10.05322265625, 11.484375, 12.91552734375, 14.3466796875, 15.77783203125, 17.208984375, 18.64013671875, 20.0712890625, 21.50244140625, 22.93359375, 24.36474609375, 25.7958984375, 27.22705078125, 28.658203125, 30.08935546875, 31.5205078125, 32.95166015625, 34.3828125, 35.81396484375, 37.2451171875, 38.67626953125, 40.107421875, 41.53857421875, 42.9697265625, 44.40087890625, 45.83203125, 47.26318359375, 48.6943359375, 50.12548828125, 51.556640625, 52.98779296875, 54.4189453125, 55.85009765625, 57.28125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 10.0, 16.0, 18.0, 32.0, 23.0, 40.0, 42.0, 50.0, 55.0, 72.0, 77.0, 68.0, 72.0, 76.0, 59.0, 67.0, 52.0, 36.0, 32.0, 25.0, 22.0, 15.0, 16.0, 3.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7109375, -5.490234375, -5.26953125, -5.048828125, -4.828125, -4.607421875, -4.38671875, -4.166015625, -3.9453125, -3.724609375, -3.50390625, -3.283203125, -3.0625, -2.841796875, -2.62109375, -2.400390625, -2.1796875, -1.958984375, -1.73828125, -1.517578125, -1.296875, -1.076171875, -0.85546875, -0.634765625, -0.4140625, -0.193359375, 0.02734375, 0.248046875, 0.46875, 0.689453125, 0.91015625, 1.130859375, 1.3515625, 1.572265625, 1.79296875, 2.013671875, 2.234375, 2.455078125, 2.67578125, 2.896484375, 3.1171875, 3.337890625, 3.55859375, 3.779296875, 4.0, 4.220703125, 4.44140625, 4.662109375, 4.8828125, 5.103515625, 5.32421875, 5.544921875, 5.765625, 5.986328125, 6.20703125, 6.427734375, 6.6484375, 6.869140625, 7.08984375, 7.310546875, 7.53125, 7.751953125, 7.97265625, 8.193359375, 8.4140625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 9.0, 7.0, 6.0, 8.0, 14.0, 20.0, 30.0, 38.0, 53.0, 103.0, 202.0, 416.0, 743.0, 1496.0, 3320.0, 8956.0, 36495.0, 427768.0, 3587747.0, 100085.0, 17401.0, 5299.0, 2048.0, 900.0, 452.0, 261.0, 143.0, 88.0, 54.0, 32.0, 26.0, 16.0, 13.0, 7.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-57.03125, -55.31591796875, -53.6005859375, -51.88525390625, -50.169921875, -48.45458984375, -46.7392578125, -45.02392578125, -43.30859375, -41.59326171875, -39.8779296875, -38.16259765625, -36.447265625, -34.73193359375, -33.0166015625, -31.30126953125, -29.5859375, -27.87060546875, -26.1552734375, -24.43994140625, -22.724609375, -21.00927734375, -19.2939453125, -17.57861328125, -15.86328125, -14.14794921875, -12.4326171875, -10.71728515625, -9.001953125, -7.28662109375, -5.5712890625, -3.85595703125, -2.140625, -0.42529296875, 1.2900390625, 3.00537109375, 4.720703125, 6.43603515625, 8.1513671875, 9.86669921875, 11.58203125, 13.29736328125, 15.0126953125, 16.72802734375, 18.443359375, 20.15869140625, 21.8740234375, 23.58935546875, 25.3046875, 27.02001953125, 28.7353515625, 30.45068359375, 32.166015625, 33.88134765625, 35.5966796875, 37.31201171875, 39.02734375, 40.74267578125, 42.4580078125, 44.17333984375, 45.888671875, 47.60400390625, 49.3193359375, 51.03466796875, 52.75]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 6.0, 10.0, 9.0, 14.0, 27.0, 38.0, 69.0, 122.0, 184.0, 450.0, 1767.0, 693.0, 284.0, 120.0, 82.0, 56.0, 39.0, 26.0, 15.0, 16.0, 7.0, 5.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.765625, -16.236572265625, -15.70751953125, -15.178466796875, -14.6494140625, -14.120361328125, -13.59130859375, -13.062255859375, -12.533203125, -12.004150390625, -11.47509765625, -10.946044921875, -10.4169921875, -9.887939453125, -9.35888671875, -8.829833984375, -8.30078125, -7.771728515625, -7.24267578125, -6.713623046875, -6.1845703125, -5.655517578125, -5.12646484375, -4.597412109375, -4.068359375, -3.539306640625, -3.01025390625, -2.481201171875, -1.9521484375, -1.423095703125, -0.89404296875, -0.364990234375, 0.1640625, 0.693115234375, 1.22216796875, 1.751220703125, 2.2802734375, 2.809326171875, 3.33837890625, 3.867431640625, 4.396484375, 4.925537109375, 5.45458984375, 5.983642578125, 6.5126953125, 7.041748046875, 7.57080078125, 8.099853515625, 8.62890625, 9.157958984375, 9.68701171875, 10.216064453125, 10.7451171875, 11.274169921875, 11.80322265625, 12.332275390625, 12.861328125, 13.390380859375, 13.91943359375, 14.448486328125, 14.9775390625, 15.506591796875, 16.03564453125, 16.564697265625, 17.09375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 24.0, 72.0, 197.0, 336.0, 218.0, 91.0, 34.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-364.27911376953125, -357.0736083984375, -349.8681335449219, -342.6626281738281, -335.4571533203125, -328.25164794921875, -321.0461730957031, -313.8406677246094, -306.63519287109375, -299.4296875, -292.2242126464844, -285.0187072753906, -277.813232421875, -270.60772705078125, -263.4022521972656, -256.1967468261719, -248.99124145507812, -241.78575134277344, -234.58026123046875, -227.37477111816406, -220.16928100585938, -212.96377563476562, -205.75830078125, -198.55279541015625, -191.34732055664062, -184.14183044433594, -176.93634033203125, -169.73085021972656, -162.52536010742188, -155.31985473632812, -148.1143798828125, -140.90887451171875, -133.703369140625, -126.49787902832031, -119.29238891601562, -112.08689880371094, -104.88140106201172, -97.67591094970703, -90.47042083740234, -83.26492309570312, -76.0594482421875, -68.85395812988281, -61.64846420288086, -54.44297409057617, -47.23748016357422, -40.03199005126953, -32.826499938964844, -25.62100601196289, -18.415512084960938, -11.210020065307617, -4.004528999328613, 3.2009620666503906, 10.406454086303711, 17.61194610595703, 24.81743621826172, 32.02293014526367, 39.22842025756836, 46.43391036987305, 53.639404296875, 60.84489440917969, 68.05038452148438, 75.25587463378906, 82.46136474609375, 89.66686248779297, 96.87235260009766]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 3.0, 11.0, 7.0, 19.0, 19.0, 14.0, 24.0, 30.0, 33.0, 35.0, 46.0, 48.0, 50.0, 54.0, 62.0, 55.0, 49.0, 54.0, 45.0, 50.0, 41.0, 44.0, 39.0, 32.0, 28.0, 23.0, 20.0, 20.0, 9.0, 8.0, 6.0, 8.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.811527252197266, -49.83913803100586, -47.86674499511719, -45.89435577392578, -43.921966552734375, -41.94957733154297, -39.9771842956543, -38.00479507446289, -36.03240203857422, -34.06001281738281, -32.08761978149414, -30.115230560302734, -28.142841339111328, -26.17045021057129, -24.19805908203125, -22.225669860839844, -20.253280639648438, -18.2808895111084, -16.308500289916992, -14.336109161376953, -12.36371898651123, -10.391328811645508, -8.418937683105469, -6.446547508239746, -4.474157333374023, -2.5017669200897217, -0.5293765068054199, 1.443014144897461, 3.4154043197631836, 5.387794494628906, 7.360185623168945, 9.332575798034668, 11.304962158203125, 13.277352333068848, 15.24974250793457, 17.22213363647461, 19.194522857666016, 21.166913986206055, 23.139305114746094, 25.1116943359375, 27.08408546447754, 29.056476593017578, 31.028865814208984, 33.001258850097656, 34.97364807128906, 36.94603729248047, 38.918426513671875, 40.89081954956055, 42.86320877075195, 44.83559799194336, 46.80799102783203, 48.78038024902344, 50.752769470214844, 52.72515869140625, 54.69755172729492, 56.66994094848633, 58.642333984375, 60.614723205566406, 62.58711624145508, 64.55950927734375, 66.53189849853516, 68.50428771972656, 70.47667694091797, 72.44906616210938, 74.42145538330078]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 8.0, 8.0, 14.0, 20.0, 22.0, 30.0, 46.0, 59.0, 69.0, 97.0, 131.0, 213.0, 277.0, 446.0, 765.0, 1342.0, 2352.0, 4951.0, 10823.0, 25352.0, 67195.0, 212340.0, 424509.0, 191600.0, 61604.0, 23743.0, 10132.0, 4752.0, 2378.0, 1296.0, 657.0, 429.0, 252.0, 192.0, 122.0, 81.0, 57.0, 44.0, 36.0, 28.0, 24.0, 15.0, 11.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-31.734375, -30.785888671875, -29.83740234375, -28.888916015625, -27.9404296875, -26.991943359375, -26.04345703125, -25.094970703125, -24.146484375, -23.197998046875, -22.24951171875, -21.301025390625, -20.3525390625, -19.404052734375, -18.45556640625, -17.507080078125, -16.55859375, -15.610107421875, -14.66162109375, -13.713134765625, -12.7646484375, -11.816162109375, -10.86767578125, -9.919189453125, -8.970703125, -8.022216796875, -7.07373046875, -6.125244140625, -5.1767578125, -4.228271484375, -3.27978515625, -2.331298828125, -1.3828125, -0.434326171875, 0.51416015625, 1.462646484375, 2.4111328125, 3.359619140625, 4.30810546875, 5.256591796875, 6.205078125, 7.153564453125, 8.10205078125, 9.050537109375, 9.9990234375, 10.947509765625, 11.89599609375, 12.844482421875, 13.79296875, 14.741455078125, 15.68994140625, 16.638427734375, 17.5869140625, 18.535400390625, 19.48388671875, 20.432373046875, 21.380859375, 22.329345703125, 23.27783203125, 24.226318359375, 25.1748046875, 26.123291015625, 27.07177734375, 28.020263671875, 28.96875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 6.0, 10.0, 11.0, 16.0, 16.0, 34.0, 45.0, 57.0, 67.0, 73.0, 86.0, 81.0, 85.0, 96.0, 70.0, 63.0, 59.0, 37.0, 26.0, 28.0, 16.0, 9.0, 8.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.921875, -7.65771484375, -7.3935546875, -7.12939453125, -6.865234375, -6.60107421875, -6.3369140625, -6.07275390625, -5.80859375, -5.54443359375, -5.2802734375, -5.01611328125, -4.751953125, -4.48779296875, -4.2236328125, -3.95947265625, -3.6953125, -3.43115234375, -3.1669921875, -2.90283203125, -2.638671875, -2.37451171875, -2.1103515625, -1.84619140625, -1.58203125, -1.31787109375, -1.0537109375, -0.78955078125, -0.525390625, -0.26123046875, 0.0029296875, 0.26708984375, 0.53125, 0.79541015625, 1.0595703125, 1.32373046875, 1.587890625, 1.85205078125, 2.1162109375, 2.38037109375, 2.64453125, 2.90869140625, 3.1728515625, 3.43701171875, 3.701171875, 3.96533203125, 4.2294921875, 4.49365234375, 4.7578125, 5.02197265625, 5.2861328125, 5.55029296875, 5.814453125, 6.07861328125, 6.3427734375, 6.60693359375, 6.87109375, 7.13525390625, 7.3994140625, 7.66357421875, 7.927734375, 8.19189453125, 8.4560546875, 8.72021484375, 8.984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 3.0, 13.0, 14.0, 26.0, 20.0, 35.0, 65.0, 84.0, 107.0, 163.0, 276.0, 435.0, 840.0, 1549.0, 3206.0, 8303.0, 24332.0, 81747.0, 297953.0, 432676.0, 136475.0, 38294.0, 12661.0, 4681.0, 1963.0, 1053.0, 564.0, 353.0, 214.0, 150.0, 94.0, 65.0, 44.0, 31.0, 15.0, 14.0, 11.0, 3.0, 2.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.328125, -26.423095703125, -25.51806640625, -24.613037109375, -23.7080078125, -22.802978515625, -21.89794921875, -20.992919921875, -20.087890625, -19.182861328125, -18.27783203125, -17.372802734375, -16.4677734375, -15.562744140625, -14.65771484375, -13.752685546875, -12.84765625, -11.942626953125, -11.03759765625, -10.132568359375, -9.2275390625, -8.322509765625, -7.41748046875, -6.512451171875, -5.607421875, -4.702392578125, -3.79736328125, -2.892333984375, -1.9873046875, -1.082275390625, -0.17724609375, 0.727783203125, 1.6328125, 2.537841796875, 3.44287109375, 4.347900390625, 5.2529296875, 6.157958984375, 7.06298828125, 7.968017578125, 8.873046875, 9.778076171875, 10.68310546875, 11.588134765625, 12.4931640625, 13.398193359375, 14.30322265625, 15.208251953125, 16.11328125, 17.018310546875, 17.92333984375, 18.828369140625, 19.7333984375, 20.638427734375, 21.54345703125, 22.448486328125, 23.353515625, 24.258544921875, 25.16357421875, 26.068603515625, 26.9736328125, 27.878662109375, 28.78369140625, 29.688720703125, 30.59375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 12.0, 11.0, 10.0, 11.0, 15.0, 20.0, 22.0, 24.0, 26.0, 24.0, 26.0, 34.0, 40.0, 45.0, 47.0, 45.0, 45.0, 47.0, 51.0, 51.0, 39.0, 44.0, 47.0, 39.0, 31.0, 34.0, 31.0, 22.0, 25.0, 19.0, 13.0, 14.0, 9.0, 4.0, 3.0, 2.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-23.28125, -22.62744140625, -21.9736328125, -21.31982421875, -20.666015625, -20.01220703125, -19.3583984375, -18.70458984375, -18.05078125, -17.39697265625, -16.7431640625, -16.08935546875, -15.435546875, -14.78173828125, -14.1279296875, -13.47412109375, -12.8203125, -12.16650390625, -11.5126953125, -10.85888671875, -10.205078125, -9.55126953125, -8.8974609375, -8.24365234375, -7.58984375, -6.93603515625, -6.2822265625, -5.62841796875, -4.974609375, -4.32080078125, -3.6669921875, -3.01318359375, -2.359375, -1.70556640625, -1.0517578125, -0.39794921875, 0.255859375, 0.90966796875, 1.5634765625, 2.21728515625, 2.87109375, 3.52490234375, 4.1787109375, 4.83251953125, 5.486328125, 6.14013671875, 6.7939453125, 7.44775390625, 8.1015625, 8.75537109375, 9.4091796875, 10.06298828125, 10.716796875, 11.37060546875, 12.0244140625, 12.67822265625, 13.33203125, 13.98583984375, 14.6396484375, 15.29345703125, 15.947265625, 16.60107421875, 17.2548828125, 17.90869140625, 18.5625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 9.0, 18.0, 11.0, 23.0, 42.0, 81.0, 103.0, 191.0, 504.0, 1613.0, 7037.0, 67937.0, 895145.0, 66125.0, 7105.0, 1571.0, 502.0, 204.0, 132.0, 56.0, 51.0, 33.0, 20.0, 15.0, 6.0, 2.0, 4.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.90625, -40.61669921875, -39.3271484375, -38.03759765625, -36.748046875, -35.45849609375, -34.1689453125, -32.87939453125, -31.58984375, -30.30029296875, -29.0107421875, -27.72119140625, -26.431640625, -25.14208984375, -23.8525390625, -22.56298828125, -21.2734375, -19.98388671875, -18.6943359375, -17.40478515625, -16.115234375, -14.82568359375, -13.5361328125, -12.24658203125, -10.95703125, -9.66748046875, -8.3779296875, -7.08837890625, -5.798828125, -4.50927734375, -3.2197265625, -1.93017578125, -0.640625, 0.64892578125, 1.9384765625, 3.22802734375, 4.517578125, 5.80712890625, 7.0966796875, 8.38623046875, 9.67578125, 10.96533203125, 12.2548828125, 13.54443359375, 14.833984375, 16.12353515625, 17.4130859375, 18.70263671875, 19.9921875, 21.28173828125, 22.5712890625, 23.86083984375, 25.150390625, 26.43994140625, 27.7294921875, 29.01904296875, 30.30859375, 31.59814453125, 32.8876953125, 34.17724609375, 35.466796875, 36.75634765625, 38.0458984375, 39.33544921875, 40.625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 8.0, 6.0, 17.0, 23.0, 30.0, 33.0, 53.0, 94.0, 117.0, 138.0, 120.0, 87.0, 96.0, 61.0, 40.0, 26.0, 13.0, 14.0, 8.0, 6.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026569366455078125, -0.0025461018085479736, -0.0024352669715881348, -0.002324432134628296, -0.002213597297668457, -0.002102762460708618, -0.0019919276237487793, -0.0018810927867889404, -0.0017702579498291016, -0.0016594231128692627, -0.0015485882759094238, -0.001437753438949585, -0.001326918601989746, -0.0012160837650299072, -0.0011052489280700684, -0.0009944140911102295, -0.0008835792541503906, -0.0007727444171905518, -0.0006619095802307129, -0.000551074743270874, -0.00044023990631103516, -0.0003294050693511963, -0.00021857023239135742, -0.00010773539543151855, 3.0994415283203125e-06, 0.00011393427848815918, 0.00022476911544799805, 0.0003356039524078369, 0.0004464387893676758, 0.0005572736263275146, 0.0006681084632873535, 0.0007789433002471924, 0.0008897781372070312, 0.0010006129741668701, 0.001111447811126709, 0.0012222826480865479, 0.0013331174850463867, 0.0014439523220062256, 0.0015547871589660645, 0.0016656219959259033, 0.0017764568328857422, 0.001887291669845581, 0.00199812650680542, 0.002108961343765259, 0.0022197961807250977, 0.0023306310176849365, 0.0024414658546447754, 0.0025523006916046143, 0.002663135528564453, 0.002773970365524292, 0.002884805202484131, 0.0029956400394439697, 0.0031064748764038086, 0.0032173097133636475, 0.0033281445503234863, 0.003438979387283325, 0.003549814224243164, 0.003660649061203003, 0.003771483898162842, 0.0038823187351226807, 0.0039931535720825195, 0.004103988409042358, 0.004214823246002197, 0.004325658082962036, 0.004436492919921875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 4.0, 6.0, 16.0, 21.0, 25.0, 48.0, 51.0, 86.0, 117.0, 182.0, 250.0, 455.0, 722.0, 1395.0, 2615.0, 5945.0, 16569.0, 86318.0, 631772.0, 253169.0, 31607.0, 8887.0, 3793.0, 1870.0, 992.0, 631.0, 360.0, 193.0, 142.0, 78.0, 88.0, 33.0, 27.0, 25.0, 22.0, 13.0, 7.0, 4.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.328125, -20.731201171875, -20.13427734375, -19.537353515625, -18.9404296875, -18.343505859375, -17.74658203125, -17.149658203125, -16.552734375, -15.955810546875, -15.35888671875, -14.761962890625, -14.1650390625, -13.568115234375, -12.97119140625, -12.374267578125, -11.77734375, -11.180419921875, -10.58349609375, -9.986572265625, -9.3896484375, -8.792724609375, -8.19580078125, -7.598876953125, -7.001953125, -6.405029296875, -5.80810546875, -5.211181640625, -4.6142578125, -4.017333984375, -3.42041015625, -2.823486328125, -2.2265625, -1.629638671875, -1.03271484375, -0.435791015625, 0.1611328125, 0.758056640625, 1.35498046875, 1.951904296875, 2.548828125, 3.145751953125, 3.74267578125, 4.339599609375, 4.9365234375, 5.533447265625, 6.13037109375, 6.727294921875, 7.32421875, 7.921142578125, 8.51806640625, 9.114990234375, 9.7119140625, 10.308837890625, 10.90576171875, 11.502685546875, 12.099609375, 12.696533203125, 13.29345703125, 13.890380859375, 14.4873046875, 15.084228515625, 15.68115234375, 16.278076171875, 16.875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 8.0, 3.0, 2.0, 5.0, 8.0, 13.0, 15.0, 21.0, 39.0, 42.0, 60.0, 78.0, 99.0, 107.0, 124.0, 99.0, 81.0, 50.0, 36.0, 34.0, 22.0, 13.0, 5.0, 11.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0859375, -13.5960693359375, -13.106201171875, -12.6163330078125, -12.12646484375, -11.6365966796875, -11.146728515625, -10.6568603515625, -10.1669921875, -9.6771240234375, -9.187255859375, -8.6973876953125, -8.20751953125, -7.7176513671875, -7.227783203125, -6.7379150390625, -6.248046875, -5.7581787109375, -5.268310546875, -4.7784423828125, -4.28857421875, -3.7987060546875, -3.308837890625, -2.8189697265625, -2.3291015625, -1.8392333984375, -1.349365234375, -0.8594970703125, -0.36962890625, 0.1202392578125, 0.610107421875, 1.0999755859375, 1.58984375, 2.0797119140625, 2.569580078125, 3.0594482421875, 3.54931640625, 4.0391845703125, 4.529052734375, 5.0189208984375, 5.5087890625, 5.9986572265625, 6.488525390625, 6.9783935546875, 7.46826171875, 7.9581298828125, 8.447998046875, 8.9378662109375, 9.427734375, 9.9176025390625, 10.407470703125, 10.8973388671875, 11.38720703125, 11.8770751953125, 12.366943359375, 12.8568115234375, 13.3466796875, 13.8365478515625, 14.326416015625, 14.8162841796875, 15.30615234375, 15.7960205078125, 16.285888671875, 16.7757568359375, 17.265625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 9.0, 18.0, 24.0, 64.0, 131.0, 199.0, 216.0, 154.0, 90.0, 40.0, 26.0, 13.0, 8.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-313.8121032714844, -304.3437805175781, -294.8754577636719, -285.4071350097656, -275.9388122558594, -266.4704895019531, -257.0021667480469, -247.53384399414062, -238.06552124023438, -228.59719848632812, -219.12887573242188, -209.66055297851562, -200.19223022460938, -190.72390747070312, -181.25558471679688, -171.78726196289062, -162.31893920898438, -152.85061645507812, -143.38229370117188, -133.91397094726562, -124.44564819335938, -114.97732543945312, -105.50900268554688, -96.04067993164062, -86.57235717773438, -77.10403442382812, -67.63571166992188, -58.167388916015625, -48.699066162109375, -39.230743408203125, -29.762420654296875, -20.294097900390625, -10.8258056640625, -1.35748291015625, 8.11083984375, 17.57916259765625, 27.0474853515625, 36.51580810546875, 45.984130859375, 55.45245361328125, 64.9207763671875, 74.38909912109375, 83.857421875, 93.32574462890625, 102.7940673828125, 112.26239013671875, 121.730712890625, 131.19903564453125, 140.6673583984375, 150.13568115234375, 159.60400390625, 169.07232666015625, 178.5406494140625, 188.00897216796875, 197.477294921875, 206.94561767578125, 216.4139404296875, 225.88226318359375, 235.3505859375, 244.81890869140625, 254.2872314453125, 263.75555419921875, 273.223876953125, 282.69219970703125, 292.1605224609375]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 12.0, 11.0, 14.0, 12.0, 16.0, 13.0, 31.0, 38.0, 27.0, 26.0, 30.0, 47.0, 39.0, 46.0, 39.0, 41.0, 50.0, 57.0, 47.0, 48.0, 52.0, 47.0, 41.0, 32.0, 27.0, 25.0, 22.0, 21.0, 20.0, 12.0, 17.0, 4.0, 3.0, 4.0, 2.0, 2.0, 7.0, 0.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.35302734375, -113.45863342285156, -109.56423950195312, -105.66983795166016, -101.77544403076172, -97.88105010986328, -93.98665618896484, -90.09225463867188, -86.19786071777344, -82.303466796875, -78.40907287597656, -74.5146713256836, -70.62027740478516, -66.72588348388672, -62.83148956298828, -58.93709182739258, -55.04269790649414, -51.1483039855957, -47.25390625, -43.35951232910156, -39.46511459350586, -35.57072067260742, -31.67632484436035, -27.78192901611328, -23.88753318786621, -19.99313735961914, -16.09874153137207, -12.204346656799316, -8.309950828552246, -4.415555953979492, -0.5211601257324219, 3.3732357025146484, 7.267631530761719, 11.162027359008789, 15.05642318725586, 18.950817108154297, 22.84521484375, 26.739608764648438, 30.634004592895508, 34.52840042114258, 38.42279815673828, 42.31719207763672, 46.21158981323242, 50.10598373413086, 54.00038146972656, 57.894775390625, 61.78916931152344, 65.68356323242188, 69.57795715332031, 73.47235107421875, 77.36674499511719, 81.26114654541016, 85.1555404663086, 89.04993438720703, 92.94432830810547, 96.83872985839844, 100.73312377929688, 104.62751770019531, 108.52191162109375, 112.41631317138672, 116.31070709228516, 120.2051010131836, 124.09949493408203, 127.993896484375, 131.88829040527344]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 13.0, 9.0, 25.0, 39.0, 51.0, 92.0, 155.0, 285.0, 474.0, 888.0, 1666.0, 3752.0, 9356.0, 30403.0, 166523.0, 3759407.0, 172548.0, 31086.0, 9680.0, 3832.0, 1785.0, 927.0, 479.0, 290.0, 147.0, 130.0, 70.0, 55.0, 30.0, 21.0, 19.0, 13.0, 4.0, 6.0, 8.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.109375, -23.993896484375, -22.87841796875, -21.762939453125, -20.6474609375, -19.531982421875, -18.41650390625, -17.301025390625, -16.185546875, -15.070068359375, -13.95458984375, -12.839111328125, -11.7236328125, -10.608154296875, -9.49267578125, -8.377197265625, -7.26171875, -6.146240234375, -5.03076171875, -3.915283203125, -2.7998046875, -1.684326171875, -0.56884765625, 0.546630859375, 1.662109375, 2.777587890625, 3.89306640625, 5.008544921875, 6.1240234375, 7.239501953125, 8.35498046875, 9.470458984375, 10.5859375, 11.701416015625, 12.81689453125, 13.932373046875, 15.0478515625, 16.163330078125, 17.27880859375, 18.394287109375, 19.509765625, 20.625244140625, 21.74072265625, 22.856201171875, 23.9716796875, 25.087158203125, 26.20263671875, 27.318115234375, 28.43359375, 29.549072265625, 30.66455078125, 31.780029296875, 32.8955078125, 34.010986328125, 35.12646484375, 36.241943359375, 37.357421875, 38.472900390625, 39.58837890625, 40.703857421875, 41.8193359375, 42.934814453125, 44.05029296875, 45.165771484375, 46.28125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 8.0, 10.0, 5.0, 13.0, 22.0, 24.0, 32.0, 47.0, 43.0, 48.0, 63.0, 71.0, 72.0, 55.0, 71.0, 69.0, 66.0, 51.0, 61.0, 34.0, 37.0, 35.0, 16.0, 18.0, 6.0, 11.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.99609375, -5.76348876953125, -5.5308837890625, -5.29827880859375, -5.065673828125, -4.83306884765625, -4.6004638671875, -4.36785888671875, -4.13525390625, -3.90264892578125, -3.6700439453125, -3.43743896484375, -3.204833984375, -2.97222900390625, -2.7396240234375, -2.50701904296875, -2.2744140625, -2.04180908203125, -1.8092041015625, -1.57659912109375, -1.343994140625, -1.11138916015625, -0.8787841796875, -0.64617919921875, -0.41357421875, -0.18096923828125, 0.0516357421875, 0.28424072265625, 0.516845703125, 0.74945068359375, 0.9820556640625, 1.21466064453125, 1.447265625, 1.67987060546875, 1.9124755859375, 2.14508056640625, 2.377685546875, 2.61029052734375, 2.8428955078125, 3.07550048828125, 3.30810546875, 3.54071044921875, 3.7733154296875, 4.00592041015625, 4.238525390625, 4.47113037109375, 4.7037353515625, 4.93634033203125, 5.1689453125, 5.40155029296875, 5.6341552734375, 5.86676025390625, 6.099365234375, 6.33197021484375, 6.5645751953125, 6.79718017578125, 7.02978515625, 7.26239013671875, 7.4949951171875, 7.72760009765625, 7.960205078125, 8.19281005859375, 8.4254150390625, 8.65802001953125, 8.890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 10.0, 5.0, 16.0, 15.0, 33.0, 38.0, 57.0, 108.0, 196.0, 383.0, 714.0, 1358.0, 3169.0, 7695.0, 23257.0, 99139.0, 2432202.0, 1502575.0, 89758.0, 20949.0, 6982.0, 2852.0, 1287.0, 671.0, 299.0, 211.0, 113.0, 58.0, 45.0, 32.0, 15.0, 6.0, 13.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-33.625, -32.6904296875, -31.755859375, -30.8212890625, -29.88671875, -28.9521484375, -28.017578125, -27.0830078125, -26.1484375, -25.2138671875, -24.279296875, -23.3447265625, -22.41015625, -21.4755859375, -20.541015625, -19.6064453125, -18.671875, -17.7373046875, -16.802734375, -15.8681640625, -14.93359375, -13.9990234375, -13.064453125, -12.1298828125, -11.1953125, -10.2607421875, -9.326171875, -8.3916015625, -7.45703125, -6.5224609375, -5.587890625, -4.6533203125, -3.71875, -2.7841796875, -1.849609375, -0.9150390625, 0.01953125, 0.9541015625, 1.888671875, 2.8232421875, 3.7578125, 4.6923828125, 5.626953125, 6.5615234375, 7.49609375, 8.4306640625, 9.365234375, 10.2998046875, 11.234375, 12.1689453125, 13.103515625, 14.0380859375, 14.97265625, 15.9072265625, 16.841796875, 17.7763671875, 18.7109375, 19.6455078125, 20.580078125, 21.5146484375, 22.44921875, 23.3837890625, 24.318359375, 25.2529296875, 26.1875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 1.0, 6.0, 5.0, 10.0, 14.0, 18.0, 19.0, 35.0, 47.0, 56.0, 81.0, 130.0, 236.0, 585.0, 1854.0, 448.0, 209.0, 103.0, 65.0, 53.0, 26.0, 22.0, 9.0, 8.0, 3.0, 4.0, 7.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-13.2578125, -12.9215087890625, -12.585205078125, -12.2489013671875, -11.91259765625, -11.5762939453125, -11.239990234375, -10.9036865234375, -10.5673828125, -10.2310791015625, -9.894775390625, -9.5584716796875, -9.22216796875, -8.8858642578125, -8.549560546875, -8.2132568359375, -7.876953125, -7.5406494140625, -7.204345703125, -6.8680419921875, -6.53173828125, -6.1954345703125, -5.859130859375, -5.5228271484375, -5.1865234375, -4.8502197265625, -4.513916015625, -4.1776123046875, -3.84130859375, -3.5050048828125, -3.168701171875, -2.8323974609375, -2.49609375, -2.1597900390625, -1.823486328125, -1.4871826171875, -1.15087890625, -0.8145751953125, -0.478271484375, -0.1419677734375, 0.1943359375, 0.5306396484375, 0.866943359375, 1.2032470703125, 1.53955078125, 1.8758544921875, 2.212158203125, 2.5484619140625, 2.884765625, 3.2210693359375, 3.557373046875, 3.8936767578125, 4.22998046875, 4.5662841796875, 4.902587890625, 5.2388916015625, 5.5751953125, 5.9114990234375, 6.247802734375, 6.5841064453125, 6.92041015625, 7.2567138671875, 7.593017578125, 7.9293212890625, 8.265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 9.0, 13.0, 27.0, 89.0, 204.0, 305.0, 236.0, 78.0, 22.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.45022583007812, -206.8256378173828, -202.20106506347656, -197.57647705078125, -192.951904296875, -188.3273162841797, -183.70274353027344, -179.07815551757812, -174.45358276367188, -169.82899475097656, -165.2044219970703, -160.579833984375, -155.95526123046875, -151.33067321777344, -146.7061004638672, -142.08151245117188, -137.45692443847656, -132.83233642578125, -128.207763671875, -123.58318328857422, -118.95860290527344, -114.33401489257812, -109.70943450927734, -105.08485412597656, -100.46027374267578, -95.835693359375, -91.21111297607422, -86.58653259277344, -81.96194458007812, -77.33737182617188, -72.71278381347656, -68.08820343017578, -63.46360778808594, -58.839027404785156, -54.214447021484375, -49.58986282348633, -44.96528244018555, -40.340702056884766, -35.71611785888672, -31.091537475585938, -26.466957092285156, -21.842376708984375, -17.21779441833496, -12.593213081359863, -7.968631744384766, -3.3440513610839844, 1.2805309295654297, 5.905113220214844, 10.529693603515625, 15.154274940490723, 19.77885627746582, 24.403438568115234, 29.028018951416016, 33.6525993347168, 38.277183532714844, 42.901763916015625, 47.526344299316406, 52.15092468261719, 56.77550506591797, 61.400089263916016, 66.02467346191406, 70.64924621582031, 75.27383422851562, 79.8984146118164, 84.52299499511719]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 10.0, 8.0, 19.0, 8.0, 13.0, 21.0, 21.0, 27.0, 37.0, 50.0, 55.0, 42.0, 55.0, 53.0, 54.0, 63.0, 42.0, 56.0, 57.0, 53.0, 43.0, 45.0, 28.0, 29.0, 30.0, 21.0, 14.0, 17.0, 9.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.777191162109375, -44.41929626464844, -43.0614013671875, -41.70350646972656, -40.345611572265625, -38.98772048950195, -37.629825592041016, -36.27193069458008, -34.91403579711914, -33.5561408996582, -32.198246002197266, -30.84035301208496, -29.482458114624023, -28.124563217163086, -26.76667022705078, -25.408775329589844, -24.050880432128906, -22.69298553466797, -21.33509063720703, -19.977197647094727, -18.61930274963379, -17.26140785217285, -15.90351390838623, -14.54561996459961, -13.187725067138672, -11.829830169677734, -10.471936225891113, -9.114042282104492, -7.756147384643555, -6.398252964019775, -5.040358543395996, -3.682464599609375, -2.324573516845703, -0.9666790962219238, 0.39121532440185547, 1.7491097450256348, 3.107004165649414, 4.464898586273193, 5.822793006896973, 7.180686950683594, 8.538581848144531, 9.896476745605469, 11.25437068939209, 12.612264633178711, 13.970159530639648, 15.328054428100586, 16.68594741821289, 18.043842315673828, 19.401737213134766, 20.759632110595703, 22.11752700805664, 23.475419998168945, 24.833314895629883, 26.19120979309082, 27.549102783203125, 28.906997680664062, 30.264892578125, 31.622787475585938, 32.980682373046875, 34.33857727050781, 35.69647216796875, 37.05436325073242, 38.41225814819336, 39.7701530456543, 41.128047943115234]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 9.0, 10.0, 27.0, 19.0, 41.0, 47.0, 81.0, 116.0, 147.0, 245.0, 387.0, 665.0, 1173.0, 2241.0, 4509.0, 9997.0, 22617.0, 59955.0, 185505.0, 414405.0, 225037.0, 72063.0, 27072.0, 11234.0, 5141.0, 2567.0, 1327.0, 697.0, 427.0, 276.0, 190.0, 80.0, 64.0, 45.0, 38.0, 25.0, 25.0, 9.0, 12.0, 7.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0], "bins": [-38.375, -37.35400390625, -36.3330078125, -35.31201171875, -34.291015625, -33.27001953125, -32.2490234375, -31.22802734375, -30.20703125, -29.18603515625, -28.1650390625, -27.14404296875, -26.123046875, -25.10205078125, -24.0810546875, -23.06005859375, -22.0390625, -21.01806640625, -19.9970703125, -18.97607421875, -17.955078125, -16.93408203125, -15.9130859375, -14.89208984375, -13.87109375, -12.85009765625, -11.8291015625, -10.80810546875, -9.787109375, -8.76611328125, -7.7451171875, -6.72412109375, -5.703125, -4.68212890625, -3.6611328125, -2.64013671875, -1.619140625, -0.59814453125, 0.4228515625, 1.44384765625, 2.46484375, 3.48583984375, 4.5068359375, 5.52783203125, 6.548828125, 7.56982421875, 8.5908203125, 9.61181640625, 10.6328125, 11.65380859375, 12.6748046875, 13.69580078125, 14.716796875, 15.73779296875, 16.7587890625, 17.77978515625, 18.80078125, 19.82177734375, 20.8427734375, 21.86376953125, 22.884765625, 23.90576171875, 24.9267578125, 25.94775390625, 26.96875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 13.0, 11.0, 17.0, 37.0, 33.0, 37.0, 54.0, 66.0, 48.0, 62.0, 54.0, 96.0, 64.0, 70.0, 62.0, 58.0, 57.0, 40.0, 27.0, 21.0, 18.0, 12.0, 7.0, 9.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.859375, -5.6290283203125, -5.398681640625, -5.1683349609375, -4.93798828125, -4.7076416015625, -4.477294921875, -4.2469482421875, -4.0166015625, -3.7862548828125, -3.555908203125, -3.3255615234375, -3.09521484375, -2.8648681640625, -2.634521484375, -2.4041748046875, -2.173828125, -1.9434814453125, -1.713134765625, -1.4827880859375, -1.25244140625, -1.0220947265625, -0.791748046875, -0.5614013671875, -0.3310546875, -0.1007080078125, 0.129638671875, 0.3599853515625, 0.59033203125, 0.8206787109375, 1.051025390625, 1.2813720703125, 1.51171875, 1.7420654296875, 1.972412109375, 2.2027587890625, 2.43310546875, 2.6634521484375, 2.893798828125, 3.1241455078125, 3.3544921875, 3.5848388671875, 3.815185546875, 4.0455322265625, 4.27587890625, 4.5062255859375, 4.736572265625, 4.9669189453125, 5.197265625, 5.4276123046875, 5.657958984375, 5.8883056640625, 6.11865234375, 6.3489990234375, 6.579345703125, 6.8096923828125, 7.0400390625, 7.2703857421875, 7.500732421875, 7.7310791015625, 7.96142578125, 8.1917724609375, 8.422119140625, 8.6524658203125, 8.8828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 10.0, 10.0, 10.0, 18.0, 29.0, 43.0, 61.0, 101.0, 143.0, 242.0, 381.0, 803.0, 1904.0, 5834.0, 24533.0, 169909.0, 667204.0, 146260.0, 22161.0, 5258.0, 1799.0, 777.0, 408.0, 210.0, 131.0, 94.0, 66.0, 36.0, 30.0, 21.0, 14.0, 16.0, 7.0, 6.0, 5.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.59375, -40.984375, -39.375, -37.765625, -36.15625, -34.546875, -32.9375, -31.328125, -29.71875, -28.109375, -26.5, -24.890625, -23.28125, -21.671875, -20.0625, -18.453125, -16.84375, -15.234375, -13.625, -12.015625, -10.40625, -8.796875, -7.1875, -5.578125, -3.96875, -2.359375, -0.75, 0.859375, 2.46875, 4.078125, 5.6875, 7.296875, 8.90625, 10.515625, 12.125, 13.734375, 15.34375, 16.953125, 18.5625, 20.171875, 21.78125, 23.390625, 25.0, 26.609375, 28.21875, 29.828125, 31.4375, 33.046875, 34.65625, 36.265625, 37.875, 39.484375, 41.09375, 42.703125, 44.3125, 45.921875, 47.53125, 49.140625, 50.75, 52.359375, 53.96875, 55.578125, 57.1875, 58.796875, 60.40625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 14.0, 8.0, 2.0, 8.0, 11.0, 11.0, 18.0, 29.0, 33.0, 30.0, 27.0, 44.0, 41.0, 51.0, 45.0, 47.0, 44.0, 52.0, 43.0, 58.0, 48.0, 48.0, 54.0, 26.0, 36.0, 34.0, 26.0, 15.0, 21.0, 21.0, 12.0, 11.0, 6.0, 6.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.640625, -18.895751953125, -18.15087890625, -17.406005859375, -16.6611328125, -15.916259765625, -15.17138671875, -14.426513671875, -13.681640625, -12.936767578125, -12.19189453125, -11.447021484375, -10.7021484375, -9.957275390625, -9.21240234375, -8.467529296875, -7.72265625, -6.977783203125, -6.23291015625, -5.488037109375, -4.7431640625, -3.998291015625, -3.25341796875, -2.508544921875, -1.763671875, -1.018798828125, -0.27392578125, 0.470947265625, 1.2158203125, 1.960693359375, 2.70556640625, 3.450439453125, 4.1953125, 4.940185546875, 5.68505859375, 6.429931640625, 7.1748046875, 7.919677734375, 8.66455078125, 9.409423828125, 10.154296875, 10.899169921875, 11.64404296875, 12.388916015625, 13.1337890625, 13.878662109375, 14.62353515625, 15.368408203125, 16.11328125, 16.858154296875, 17.60302734375, 18.347900390625, 19.0927734375, 19.837646484375, 20.58251953125, 21.327392578125, 22.072265625, 22.817138671875, 23.56201171875, 24.306884765625, 25.0517578125, 25.796630859375, 26.54150390625, 27.286376953125, 28.03125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 2.0, 5.0, 7.0, 11.0, 14.0, 15.0, 21.0, 36.0, 47.0, 85.0, 116.0, 184.0, 290.0, 561.0, 1095.0, 2235.0, 5622.0, 16068.0, 62776.0, 392457.0, 460983.0, 76102.0, 18398.0, 6205.0, 2536.0, 1169.0, 589.0, 353.0, 181.0, 129.0, 90.0, 57.0, 32.0, 26.0, 18.0, 11.0, 8.0, 3.0, 5.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.515625, -17.0159912109375, -16.516357421875, -16.0167236328125, -15.51708984375, -15.0174560546875, -14.517822265625, -14.0181884765625, -13.5185546875, -13.0189208984375, -12.519287109375, -12.0196533203125, -11.52001953125, -11.0203857421875, -10.520751953125, -10.0211181640625, -9.521484375, -9.0218505859375, -8.522216796875, -8.0225830078125, -7.52294921875, -7.0233154296875, -6.523681640625, -6.0240478515625, -5.5244140625, -5.0247802734375, -4.525146484375, -4.0255126953125, -3.52587890625, -3.0262451171875, -2.526611328125, -2.0269775390625, -1.52734375, -1.0277099609375, -0.528076171875, -0.0284423828125, 0.47119140625, 0.9708251953125, 1.470458984375, 1.9700927734375, 2.4697265625, 2.9693603515625, 3.468994140625, 3.9686279296875, 4.46826171875, 4.9678955078125, 5.467529296875, 5.9671630859375, 6.466796875, 6.9664306640625, 7.466064453125, 7.9656982421875, 8.46533203125, 8.9649658203125, 9.464599609375, 9.9642333984375, 10.4638671875, 10.9635009765625, 11.463134765625, 11.9627685546875, 12.46240234375, 12.9620361328125, 13.461669921875, 13.9613037109375, 14.4609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 9.0, 7.0, 9.0, 16.0, 15.0, 26.0, 31.0, 45.0, 83.0, 79.0, 93.0, 123.0, 101.0, 98.0, 57.0, 55.0, 44.0, 29.0, 17.0, 12.0, 16.0, 11.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0034122467041015625, -0.003313213586807251, -0.0032141804695129395, -0.003115147352218628, -0.0030161142349243164, -0.002917081117630005, -0.0028180480003356934, -0.002719014883041382, -0.0026199817657470703, -0.002520948648452759, -0.0024219155311584473, -0.0023228824138641357, -0.0022238492965698242, -0.0021248161792755127, -0.002025783061981201, -0.0019267499446868896, -0.0018277168273925781, -0.0017286837100982666, -0.001629650592803955, -0.0015306174755096436, -0.001431584358215332, -0.0013325512409210205, -0.001233518123626709, -0.0011344850063323975, -0.001035451889038086, -0.0009364187717437744, -0.0008373856544494629, -0.0007383525371551514, -0.0006393194198608398, -0.0005402863025665283, -0.0004412531852722168, -0.0003422200679779053, -0.00024318695068359375, -0.00014415383338928223, -4.51207160949707e-05, 5.391240119934082e-05, 0.00015294551849365234, 0.00025197863578796387, 0.0003510117530822754, 0.0004500448703765869, 0.0005490779876708984, 0.00064811110496521, 0.0007471442222595215, 0.000846177339553833, 0.0009452104568481445, 0.001044243574142456, 0.0011432766914367676, 0.001242309808731079, 0.0013413429260253906, 0.0014403760433197021, 0.0015394091606140137, 0.0016384422779083252, 0.0017374753952026367, 0.0018365085124969482, 0.0019355416297912598, 0.0020345747470855713, 0.002133607864379883, 0.0022326409816741943, 0.002331674098968506, 0.0024307072162628174, 0.002529740333557129, 0.0026287734508514404, 0.002727806568145752, 0.0028268396854400635, 0.002925872802734375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 11.0, 3.0, 8.0, 14.0, 26.0, 61.0, 105.0, 239.0, 449.0, 1296.0, 5141.0, 66328.0, 915945.0, 52374.0, 4502.0, 1171.0, 450.0, 179.0, 98.0, 66.0, 29.0, 21.0, 6.0, 6.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.0, -35.956787109375, -34.91357421875, -33.870361328125, -32.8271484375, -31.783935546875, -30.74072265625, -29.697509765625, -28.654296875, -27.611083984375, -26.56787109375, -25.524658203125, -24.4814453125, -23.438232421875, -22.39501953125, -21.351806640625, -20.30859375, -19.265380859375, -18.22216796875, -17.178955078125, -16.1357421875, -15.092529296875, -14.04931640625, -13.006103515625, -11.962890625, -10.919677734375, -9.87646484375, -8.833251953125, -7.7900390625, -6.746826171875, -5.70361328125, -4.660400390625, -3.6171875, -2.573974609375, -1.53076171875, -0.487548828125, 0.5556640625, 1.598876953125, 2.64208984375, 3.685302734375, 4.728515625, 5.771728515625, 6.81494140625, 7.858154296875, 8.9013671875, 9.944580078125, 10.98779296875, 12.031005859375, 13.07421875, 14.117431640625, 15.16064453125, 16.203857421875, 17.2470703125, 18.290283203125, 19.33349609375, 20.376708984375, 21.419921875, 22.463134765625, 23.50634765625, 24.549560546875, 25.5927734375, 26.635986328125, 27.67919921875, 28.722412109375, 29.765625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 9.0, 14.0, 34.0, 53.0, 75.0, 78.0, 114.0, 119.0, 140.0, 96.0, 84.0, 57.0, 43.0, 20.0, 21.0, 16.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15625, -18.636962890625, -18.11767578125, -17.598388671875, -17.0791015625, -16.559814453125, -16.04052734375, -15.521240234375, -15.001953125, -14.482666015625, -13.96337890625, -13.444091796875, -12.9248046875, -12.405517578125, -11.88623046875, -11.366943359375, -10.84765625, -10.328369140625, -9.80908203125, -9.289794921875, -8.7705078125, -8.251220703125, -7.73193359375, -7.212646484375, -6.693359375, -6.174072265625, -5.65478515625, -5.135498046875, -4.6162109375, -4.096923828125, -3.57763671875, -3.058349609375, -2.5390625, -2.019775390625, -1.50048828125, -0.981201171875, -0.4619140625, 0.057373046875, 0.57666015625, 1.095947265625, 1.615234375, 2.134521484375, 2.65380859375, 3.173095703125, 3.6923828125, 4.211669921875, 4.73095703125, 5.250244140625, 5.76953125, 6.288818359375, 6.80810546875, 7.327392578125, 7.8466796875, 8.365966796875, 8.88525390625, 9.404541015625, 9.923828125, 10.443115234375, 10.96240234375, 11.481689453125, 12.0009765625, 12.520263671875, 13.03955078125, 13.558837890625, 14.078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 11.0, 18.0, 31.0, 49.0, 89.0, 174.0, 254.0, 191.0, 91.0, 37.0, 25.0, 15.0, 9.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-319.599365234375, -307.93145751953125, -296.2635192871094, -284.5956115722656, -272.92767333984375, -261.259765625, -249.5918426513672, -237.92391967773438, -226.25599670410156, -214.58807373046875, -202.92015075683594, -191.25222778320312, -179.58432006835938, -167.9163818359375, -156.24847412109375, -144.58055114746094, -132.91262817382812, -121.24470520019531, -109.5767822265625, -97.90886688232422, -86.2409439086914, -74.5730209350586, -62.90510559082031, -51.2371826171875, -39.56925964355469, -27.901338577270508, -16.233417510986328, -4.565498352050781, 7.102424621582031, 18.770347595214844, 30.438262939453125, 42.10618591308594, 53.77410888671875, 65.44203186035156, 77.10995483398438, 88.77787017822266, 100.44579315185547, 112.11371612548828, 123.78163146972656, 135.44955444335938, 147.1174774169922, 158.785400390625, 170.4533233642578, 182.12124633789062, 193.78915405273438, 205.45709228515625, 217.125, 228.7929229736328, 240.46084594726562, 252.12876892089844, 263.79669189453125, 275.464599609375, 287.1325378417969, 298.8004455566406, 310.4683837890625, 322.13629150390625, 333.80419921875, 345.47210693359375, 357.1400451660156, 368.8079528808594, 380.47589111328125, 392.143798828125, 403.81170654296875, 415.4796447753906, 427.1475830078125]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 3.0, 7.0, 7.0, 9.0, 3.0, 7.0, 7.0, 13.0, 28.0, 22.0, 12.0, 19.0, 24.0, 28.0, 34.0, 29.0, 34.0, 35.0, 46.0, 35.0, 36.0, 49.0, 44.0, 37.0, 40.0, 48.0, 41.0, 34.0, 24.0, 39.0, 22.0, 22.0, 24.0, 23.0, 21.0, 19.0, 7.0, 16.0, 7.0, 14.0, 5.0, 11.0, 8.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.26374816894531, -118.38245391845703, -114.50115203857422, -110.61985778808594, -106.73856353759766, -102.85726165771484, -98.97596740722656, -95.09466552734375, -91.21337127685547, -87.33207702636719, -83.45077514648438, -79.5694808959961, -75.68818664550781, -71.806884765625, -67.92559051513672, -64.04429626464844, -60.16299819946289, -56.281700134277344, -52.40040588378906, -48.519107818603516, -44.63780975341797, -40.75651550292969, -36.87521743774414, -32.993919372558594, -29.11262321472168, -25.231327056884766, -21.35002899169922, -17.468732833862305, -13.587435722351074, -9.706138610839844, -5.82484245300293, -1.9435443878173828, 1.9377517700195312, 5.819048881530762, 9.700345993041992, 13.581642150878906, 17.462940216064453, 21.344236373901367, 25.22553253173828, 29.106830596923828, 32.988128662109375, 36.86942672729492, 40.7507209777832, 44.63201904296875, 48.5133171081543, 52.394615173339844, 56.275909423828125, 60.15720748901367, 64.03849792480469, 67.91979217529297, 71.80109405517578, 75.68238830566406, 79.56368255615234, 83.44498443603516, 87.32627868652344, 91.20758056640625, 95.08887481689453, 98.97016906738281, 102.85147094726562, 106.7327651977539, 110.61405944824219, 114.495361328125, 118.37665557861328, 122.25794982910156, 126.13925170898438]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 12.0, 11.0, 23.0, 22.0, 39.0, 71.0, 82.0, 157.0, 204.0, 350.0, 558.0, 918.0, 1495.0, 2597.0, 4555.0, 8322.0, 17496.0, 45454.0, 186244.0, 3487867.0, 331018.0, 62411.0, 21837.0, 9853.0, 5153.0, 2908.0, 1681.0, 1050.0, 639.0, 446.0, 257.0, 176.0, 104.0, 83.0, 56.0, 40.0, 30.0, 10.0, 21.0, 5.0, 4.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.765625, -27.93505859375, -27.1044921875, -26.27392578125, -25.443359375, -24.61279296875, -23.7822265625, -22.95166015625, -22.12109375, -21.29052734375, -20.4599609375, -19.62939453125, -18.798828125, -17.96826171875, -17.1376953125, -16.30712890625, -15.4765625, -14.64599609375, -13.8154296875, -12.98486328125, -12.154296875, -11.32373046875, -10.4931640625, -9.66259765625, -8.83203125, -8.00146484375, -7.1708984375, -6.34033203125, -5.509765625, -4.67919921875, -3.8486328125, -3.01806640625, -2.1875, -1.35693359375, -0.5263671875, 0.30419921875, 1.134765625, 1.96533203125, 2.7958984375, 3.62646484375, 4.45703125, 5.28759765625, 6.1181640625, 6.94873046875, 7.779296875, 8.60986328125, 9.4404296875, 10.27099609375, 11.1015625, 11.93212890625, 12.7626953125, 13.59326171875, 14.423828125, 15.25439453125, 16.0849609375, 16.91552734375, 17.74609375, 18.57666015625, 19.4072265625, 20.23779296875, 21.068359375, 21.89892578125, 22.7294921875, 23.56005859375, 24.390625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 4.0, 3.0, 8.0, 4.0, 11.0, 16.0, 17.0, 23.0, 20.0, 34.0, 34.0, 42.0, 41.0, 36.0, 39.0, 38.0, 55.0, 73.0, 53.0, 43.0, 67.0, 42.0, 45.0, 51.0, 31.0, 39.0, 21.0, 22.0, 17.0, 14.0, 20.0, 8.0, 7.0, 5.0, 5.0, 7.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.78125, -5.568359375, -5.35546875, -5.142578125, -4.9296875, -4.716796875, -4.50390625, -4.291015625, -4.078125, -3.865234375, -3.65234375, -3.439453125, -3.2265625, -3.013671875, -2.80078125, -2.587890625, -2.375, -2.162109375, -1.94921875, -1.736328125, -1.5234375, -1.310546875, -1.09765625, -0.884765625, -0.671875, -0.458984375, -0.24609375, -0.033203125, 0.1796875, 0.392578125, 0.60546875, 0.818359375, 1.03125, 1.244140625, 1.45703125, 1.669921875, 1.8828125, 2.095703125, 2.30859375, 2.521484375, 2.734375, 2.947265625, 3.16015625, 3.373046875, 3.5859375, 3.798828125, 4.01171875, 4.224609375, 4.4375, 4.650390625, 4.86328125, 5.076171875, 5.2890625, 5.501953125, 5.71484375, 5.927734375, 6.140625, 6.353515625, 6.56640625, 6.779296875, 6.9921875, 7.205078125, 7.41796875, 7.630859375, 7.84375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 13.0, 19.0, 17.0, 28.0, 42.0, 53.0, 79.0, 120.0, 203.0, 385.0, 1008.0, 2553.0, 8004.0, 31218.0, 215581.0, 3685901.0, 207250.0, 29991.0, 7620.0, 2378.0, 898.0, 360.0, 204.0, 126.0, 68.0, 44.0, 35.0, 22.0, 17.0, 13.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.03125, -36.74169921875, -35.4521484375, -34.16259765625, -32.873046875, -31.58349609375, -30.2939453125, -29.00439453125, -27.71484375, -26.42529296875, -25.1357421875, -23.84619140625, -22.556640625, -21.26708984375, -19.9775390625, -18.68798828125, -17.3984375, -16.10888671875, -14.8193359375, -13.52978515625, -12.240234375, -10.95068359375, -9.6611328125, -8.37158203125, -7.08203125, -5.79248046875, -4.5029296875, -3.21337890625, -1.923828125, -0.63427734375, 0.6552734375, 1.94482421875, 3.234375, 4.52392578125, 5.8134765625, 7.10302734375, 8.392578125, 9.68212890625, 10.9716796875, 12.26123046875, 13.55078125, 14.84033203125, 16.1298828125, 17.41943359375, 18.708984375, 19.99853515625, 21.2880859375, 22.57763671875, 23.8671875, 25.15673828125, 26.4462890625, 27.73583984375, 29.025390625, 30.31494140625, 31.6044921875, 32.89404296875, 34.18359375, 35.47314453125, 36.7626953125, 38.05224609375, 39.341796875, 40.63134765625, 41.9208984375, 43.21044921875, 44.5]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 11.0, 11.0, 13.0, 19.0, 15.0, 28.0, 45.0, 77.0, 131.0, 244.0, 695.0, 1816.0, 466.0, 194.0, 91.0, 72.0, 46.0, 27.0, 24.0, 18.0, 10.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-24.453125, -23.9366455078125, -23.420166015625, -22.9036865234375, -22.38720703125, -21.8707275390625, -21.354248046875, -20.8377685546875, -20.3212890625, -19.8048095703125, -19.288330078125, -18.7718505859375, -18.25537109375, -17.7388916015625, -17.222412109375, -16.7059326171875, -16.189453125, -15.6729736328125, -15.156494140625, -14.6400146484375, -14.12353515625, -13.6070556640625, -13.090576171875, -12.5740966796875, -12.0576171875, -11.5411376953125, -11.024658203125, -10.5081787109375, -9.99169921875, -9.4752197265625, -8.958740234375, -8.4422607421875, -7.92578125, -7.4093017578125, -6.892822265625, -6.3763427734375, -5.85986328125, -5.3433837890625, -4.826904296875, -4.3104248046875, -3.7939453125, -3.2774658203125, -2.760986328125, -2.2445068359375, -1.72802734375, -1.2115478515625, -0.695068359375, -0.1785888671875, 0.337890625, 0.8543701171875, 1.370849609375, 1.8873291015625, 2.40380859375, 2.9202880859375, 3.436767578125, 3.9532470703125, 4.4697265625, 4.9862060546875, 5.502685546875, 6.0191650390625, 6.53564453125, 7.0521240234375, 7.568603515625, 8.0850830078125, 8.6015625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 8.0, 16.0, 35.0, 49.0, 98.0, 166.0, 215.0, 168.0, 104.0, 57.0, 35.0, 18.0, 8.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-141.2550048828125, -137.31082153320312, -133.3666534423828, -129.42247009277344, -125.47828674316406, -121.53411102294922, -117.58993530273438, -113.645751953125, -109.70157623291016, -105.75740051269531, -101.81321716308594, -97.8690414428711, -93.92486572265625, -89.98068237304688, -86.03650665283203, -82.09233093261719, -78.14814758300781, -74.20397186279297, -70.2597885131836, -66.31561279296875, -62.37143325805664, -58.42725372314453, -54.48307800292969, -50.53889846801758, -46.59471893310547, -42.65053939819336, -38.70635986328125, -34.762184143066406, -30.818004608154297, -26.873825073242188, -22.92964744567871, -18.985469818115234, -15.041297912597656, -11.097119331359863, -7.15294075012207, -3.2087621688842773, 0.7354164123535156, 4.679595947265625, 8.623773574829102, 12.567951202392578, 16.512130737304688, 20.456310272216797, 24.400487899780273, 28.34466552734375, 32.28884506225586, 36.23302459716797, 40.17720031738281, 44.12137985229492, 48.06555938720703, 52.00973892211914, 55.95391845703125, 59.898094177246094, 63.8422737121582, 67.78645324707031, 71.73062896728516, 75.6748046875, 79.61898803710938, 83.56316375732422, 87.5073471069336, 91.45152282714844, 95.39570617675781, 99.33988189697266, 103.2840576171875, 107.22824096679688, 111.17241668701172]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 19.0, 11.0, 22.0, 24.0, 26.0, 30.0, 32.0, 45.0, 41.0, 33.0, 52.0, 50.0, 57.0, 50.0, 48.0, 46.0, 51.0, 42.0, 48.0, 39.0, 37.0, 31.0, 24.0, 25.0, 20.0, 17.0, 19.0, 14.0, 11.0, 8.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.7086181640625, -46.08142852783203, -44.4542350769043, -42.82704162597656, -41.199851989746094, -39.572662353515625, -37.94546890258789, -36.318275451660156, -34.69108581542969, -33.06389617919922, -31.436702728271484, -29.809511184692383, -28.18231964111328, -26.55512809753418, -24.927936553955078, -23.300745010375977, -21.673553466796875, -20.046361923217773, -18.419170379638672, -16.79197883605957, -15.164787292480469, -13.537595748901367, -11.910404205322266, -10.283212661743164, -8.656021118164062, -7.028829574584961, -5.401638031005859, -3.774446487426758, -2.1472549438476562, -0.5200634002685547, 1.1071281433105469, 2.7343196868896484, 4.361507415771484, 5.988698959350586, 7.6158905029296875, 9.243082046508789, 10.87027359008789, 12.497465133666992, 14.124656677246094, 15.751848220825195, 17.379039764404297, 19.0062313079834, 20.6334228515625, 22.2606143951416, 23.887805938720703, 25.514997482299805, 27.142189025878906, 28.769380569458008, 30.39657211303711, 32.023765563964844, 33.65095520019531, 35.27814483642578, 36.905338287353516, 38.53253173828125, 40.15972137451172, 41.78691101074219, 43.41410446166992, 45.041297912597656, 46.668487548828125, 48.295677185058594, 49.92287063598633, 51.55006408691406, 53.17725372314453, 54.804443359375, 56.431636810302734]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 19.0, 20.0, 23.0, 43.0, 44.0, 65.0, 114.0, 171.0, 245.0, 358.0, 654.0, 1013.0, 1589.0, 2705.0, 4756.0, 8848.0, 16634.0, 34211.0, 76902.0, 195841.0, 392497.0, 175362.0, 69872.0, 31669.0, 15430.0, 8259.0, 4535.0, 2580.0, 1499.0, 946.0, 596.0, 350.0, 234.0, 155.0, 75.0, 73.0, 48.0, 30.0, 25.0, 21.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.46875, -28.587646484375, -27.70654296875, -26.825439453125, -25.9443359375, -25.063232421875, -24.18212890625, -23.301025390625, -22.419921875, -21.538818359375, -20.65771484375, -19.776611328125, -18.8955078125, -18.014404296875, -17.13330078125, -16.252197265625, -15.37109375, -14.489990234375, -13.60888671875, -12.727783203125, -11.8466796875, -10.965576171875, -10.08447265625, -9.203369140625, -8.322265625, -7.441162109375, -6.56005859375, -5.678955078125, -4.7978515625, -3.916748046875, -3.03564453125, -2.154541015625, -1.2734375, -0.392333984375, 0.48876953125, 1.369873046875, 2.2509765625, 3.132080078125, 4.01318359375, 4.894287109375, 5.775390625, 6.656494140625, 7.53759765625, 8.418701171875, 9.2998046875, 10.180908203125, 11.06201171875, 11.943115234375, 12.82421875, 13.705322265625, 14.58642578125, 15.467529296875, 16.3486328125, 17.229736328125, 18.11083984375, 18.991943359375, 19.873046875, 20.754150390625, 21.63525390625, 22.516357421875, 23.3974609375, 24.278564453125, 25.15966796875, 26.040771484375, 26.921875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 4.0, 13.0, 11.0, 11.0, 20.0, 24.0, 34.0, 33.0, 32.0, 36.0, 45.0, 46.0, 58.0, 48.0, 54.0, 55.0, 52.0, 47.0, 63.0, 55.0, 47.0, 41.0, 31.0, 15.0, 30.0, 19.0, 12.0, 16.0, 16.0, 8.0, 3.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.00390625, -5.77630615234375, -5.5487060546875, -5.32110595703125, -5.093505859375, -4.86590576171875, -4.6383056640625, -4.41070556640625, -4.18310546875, -3.95550537109375, -3.7279052734375, -3.50030517578125, -3.272705078125, -3.04510498046875, -2.8175048828125, -2.58990478515625, -2.3623046875, -2.13470458984375, -1.9071044921875, -1.67950439453125, -1.451904296875, -1.22430419921875, -0.9967041015625, -0.76910400390625, -0.54150390625, -0.31390380859375, -0.0863037109375, 0.14129638671875, 0.368896484375, 0.59649658203125, 0.8240966796875, 1.05169677734375, 1.279296875, 1.50689697265625, 1.7344970703125, 1.96209716796875, 2.189697265625, 2.41729736328125, 2.6448974609375, 2.87249755859375, 3.10009765625, 3.32769775390625, 3.5552978515625, 3.78289794921875, 4.010498046875, 4.23809814453125, 4.4656982421875, 4.69329833984375, 4.9208984375, 5.14849853515625, 5.3760986328125, 5.60369873046875, 5.831298828125, 6.05889892578125, 6.2864990234375, 6.51409912109375, 6.74169921875, 6.96929931640625, 7.1968994140625, 7.42449951171875, 7.652099609375, 7.87969970703125, 8.1072998046875, 8.33489990234375, 8.5625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 1.0, 7.0, 7.0, 5.0, 8.0, 14.0, 14.0, 28.0, 25.0, 36.0, 51.0, 97.0, 128.0, 191.0, 355.0, 681.0, 1421.0, 3532.0, 11861.0, 56820.0, 462506.0, 439589.0, 53361.0, 11222.0, 3557.0, 1451.0, 643.0, 362.0, 199.0, 123.0, 75.0, 57.0, 41.0, 27.0, 21.0, 8.0, 9.0, 11.0, 1.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.5, -52.7412109375, -50.982421875, -49.2236328125, -47.46484375, -45.7060546875, -43.947265625, -42.1884765625, -40.4296875, -38.6708984375, -36.912109375, -35.1533203125, -33.39453125, -31.6357421875, -29.876953125, -28.1181640625, -26.359375, -24.6005859375, -22.841796875, -21.0830078125, -19.32421875, -17.5654296875, -15.806640625, -14.0478515625, -12.2890625, -10.5302734375, -8.771484375, -7.0126953125, -5.25390625, -3.4951171875, -1.736328125, 0.0224609375, 1.78125, 3.5400390625, 5.298828125, 7.0576171875, 8.81640625, 10.5751953125, 12.333984375, 14.0927734375, 15.8515625, 17.6103515625, 19.369140625, 21.1279296875, 22.88671875, 24.6455078125, 26.404296875, 28.1630859375, 29.921875, 31.6806640625, 33.439453125, 35.1982421875, 36.95703125, 38.7158203125, 40.474609375, 42.2333984375, 43.9921875, 45.7509765625, 47.509765625, 49.2685546875, 51.02734375, 52.7861328125, 54.544921875, 56.3037109375, 58.0625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 2.0, 10.0, 5.0, 8.0, 5.0, 9.0, 13.0, 13.0, 21.0, 19.0, 27.0, 42.0, 38.0, 44.0, 43.0, 53.0, 37.0, 58.0, 51.0, 55.0, 52.0, 65.0, 45.0, 45.0, 34.0, 44.0, 29.0, 30.0, 24.0, 21.0, 13.0, 6.0, 11.0, 7.0, 7.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.546875, -28.6259765625, -27.705078125, -26.7841796875, -25.86328125, -24.9423828125, -24.021484375, -23.1005859375, -22.1796875, -21.2587890625, -20.337890625, -19.4169921875, -18.49609375, -17.5751953125, -16.654296875, -15.7333984375, -14.8125, -13.8916015625, -12.970703125, -12.0498046875, -11.12890625, -10.2080078125, -9.287109375, -8.3662109375, -7.4453125, -6.5244140625, -5.603515625, -4.6826171875, -3.76171875, -2.8408203125, -1.919921875, -0.9990234375, -0.078125, 0.8427734375, 1.763671875, 2.6845703125, 3.60546875, 4.5263671875, 5.447265625, 6.3681640625, 7.2890625, 8.2099609375, 9.130859375, 10.0517578125, 10.97265625, 11.8935546875, 12.814453125, 13.7353515625, 14.65625, 15.5771484375, 16.498046875, 17.4189453125, 18.33984375, 19.2607421875, 20.181640625, 21.1025390625, 22.0234375, 22.9443359375, 23.865234375, 24.7861328125, 25.70703125, 26.6279296875, 27.548828125, 28.4697265625, 29.390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 16.0, 37.0, 47.0, 73.0, 151.0, 313.0, 845.0, 3744.0, 59929.0, 969348.0, 11291.0, 1757.0, 501.0, 205.0, 114.0, 63.0, 42.0, 23.0, 18.0, 11.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.875, -111.3154296875, -107.755859375, -104.1962890625, -100.63671875, -97.0771484375, -93.517578125, -89.9580078125, -86.3984375, -82.8388671875, -79.279296875, -75.7197265625, -72.16015625, -68.6005859375, -65.041015625, -61.4814453125, -57.921875, -54.3623046875, -50.802734375, -47.2431640625, -43.68359375, -40.1240234375, -36.564453125, -33.0048828125, -29.4453125, -25.8857421875, -22.326171875, -18.7666015625, -15.20703125, -11.6474609375, -8.087890625, -4.5283203125, -0.96875, 2.5908203125, 6.150390625, 9.7099609375, 13.26953125, 16.8291015625, 20.388671875, 23.9482421875, 27.5078125, 31.0673828125, 34.626953125, 38.1865234375, 41.74609375, 45.3056640625, 48.865234375, 52.4248046875, 55.984375, 59.5439453125, 63.103515625, 66.6630859375, 70.22265625, 73.7822265625, 77.341796875, 80.9013671875, 84.4609375, 88.0205078125, 91.580078125, 95.1396484375, 98.69921875, 102.2587890625, 105.818359375, 109.3779296875, 112.9375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 10.0, 16.0, 35.0, 105.0, 466.0, 273.0, 64.0, 17.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02197265625, -0.02152228355407715, -0.021071910858154297, -0.020621538162231445, -0.020171165466308594, -0.019720792770385742, -0.01927042007446289, -0.01882004737854004, -0.018369674682617188, -0.017919301986694336, -0.017468929290771484, -0.017018556594848633, -0.01656818389892578, -0.01611781120300293, -0.015667438507080078, -0.015217065811157227, -0.014766693115234375, -0.014316320419311523, -0.013865947723388672, -0.01341557502746582, -0.012965202331542969, -0.012514829635620117, -0.012064456939697266, -0.011614084243774414, -0.011163711547851562, -0.010713338851928711, -0.01026296615600586, -0.009812593460083008, -0.009362220764160156, -0.008911848068237305, -0.008461475372314453, -0.008011102676391602, -0.00756072998046875, -0.0071103572845458984, -0.006659984588623047, -0.006209611892700195, -0.005759239196777344, -0.005308866500854492, -0.004858493804931641, -0.004408121109008789, -0.0039577484130859375, -0.003507375717163086, -0.0030570030212402344, -0.002606630325317383, -0.0021562576293945312, -0.0017058849334716797, -0.0012555122375488281, -0.0008051395416259766, -0.000354766845703125, 9.560585021972656e-05, 0.0005459785461425781, 0.0009963512420654297, 0.0014467239379882812, 0.0018970966339111328, 0.0023474693298339844, 0.002797842025756836, 0.0032482147216796875, 0.003698587417602539, 0.004148960113525391, 0.004599332809448242, 0.005049705505371094, 0.005500078201293945, 0.005950450897216797, 0.0064008235931396484, 0.0068511962890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 4.0, 14.0, 21.0, 19.0, 41.0, 66.0, 103.0, 226.0, 494.0, 1975.0, 16018.0, 1011159.0, 15479.0, 1913.0, 519.0, 215.0, 111.0, 59.0, 47.0, 28.0, 14.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-141.5, -137.513671875, -133.52734375, -129.541015625, -125.5546875, -121.568359375, -117.58203125, -113.595703125, -109.609375, -105.623046875, -101.63671875, -97.650390625, -93.6640625, -89.677734375, -85.69140625, -81.705078125, -77.71875, -73.732421875, -69.74609375, -65.759765625, -61.7734375, -57.787109375, -53.80078125, -49.814453125, -45.828125, -41.841796875, -37.85546875, -33.869140625, -29.8828125, -25.896484375, -21.91015625, -17.923828125, -13.9375, -9.951171875, -5.96484375, -1.978515625, 2.0078125, 5.994140625, 9.98046875, 13.966796875, 17.953125, 21.939453125, 25.92578125, 29.912109375, 33.8984375, 37.884765625, 41.87109375, 45.857421875, 49.84375, 53.830078125, 57.81640625, 61.802734375, 65.7890625, 69.775390625, 73.76171875, 77.748046875, 81.734375, 85.720703125, 89.70703125, 93.693359375, 97.6796875, 101.666015625, 105.65234375, 109.638671875, 113.625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 54.0, 142.0, 396.0, 256.0, 95.0, 26.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.5625, -78.24609375, -75.9296875, -73.61328125, -71.296875, -68.98046875, -66.6640625, -64.34765625, -62.03125, -59.71484375, -57.3984375, -55.08203125, -52.765625, -50.44921875, -48.1328125, -45.81640625, -43.5, -41.18359375, -38.8671875, -36.55078125, -34.234375, -31.91796875, -29.6015625, -27.28515625, -24.96875, -22.65234375, -20.3359375, -18.01953125, -15.703125, -13.38671875, -11.0703125, -8.75390625, -6.4375, -4.12109375, -1.8046875, 0.51171875, 2.828125, 5.14453125, 7.4609375, 9.77734375, 12.09375, 14.41015625, 16.7265625, 19.04296875, 21.359375, 23.67578125, 25.9921875, 28.30859375, 30.625, 32.94140625, 35.2578125, 37.57421875, 39.890625, 42.20703125, 44.5234375, 46.83984375, 49.15625, 51.47265625, 53.7890625, 56.10546875, 58.421875, 60.73828125, 63.0546875, 65.37109375, 67.6875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 3.0, 12.0, 14.0, 31.0, 115.0, 226.0, 300.0, 185.0, 75.0, 29.0, 10.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.8754119873047, -215.21688842773438, -192.55836486816406, -169.89984130859375, -147.2413330078125, -124.58280181884766, -101.92428588867188, -79.26576232910156, -56.60723876953125, -33.94871520996094, -11.29019546508789, 11.368324279785156, 34.02684783935547, 56.68537139892578, 79.34388732910156, 102.00241088867188, 124.66093444824219, 147.3194580078125, 169.9779815673828, 192.63650512695312, 215.29501342773438, 237.95355224609375, 260.612060546875, 283.27056884765625, 305.9291076660156, 328.5876159667969, 351.24615478515625, 373.9046630859375, 396.5632019042969, 419.2217102050781, 441.8802490234375, 464.53875732421875, 487.19732666015625, 509.8558349609375, 532.5143432617188, 555.1729125976562, 577.8314208984375, 600.4899291992188, 623.1484375, 645.8070068359375, 668.4655151367188, 691.1240234375, 713.7825317382812, 736.4411010742188, 759.099609375, 781.7581176757812, 804.4166259765625, 827.0751953125, 849.733642578125, 872.3921508789062, 895.0506591796875, 917.709228515625, 940.3677368164062, 963.0262451171875, 985.6847534179688, 1008.34326171875, 1031.0018310546875, 1053.660400390625, 1076.31884765625, 1098.9774169921875, 1121.6358642578125, 1144.29443359375, 1166.9530029296875, 1189.6114501953125, 1212.27001953125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 2.0, 4.0, 6.0, 5.0, 2.0, 11.0, 9.0, 12.0, 23.0, 17.0, 24.0, 26.0, 20.0, 29.0, 28.0, 33.0, 37.0, 31.0, 37.0, 41.0, 35.0, 33.0, 46.0, 33.0, 48.0, 46.0, 33.0, 40.0, 36.0, 30.0, 32.0, 29.0, 17.0, 22.0, 21.0, 18.0, 15.0, 10.0, 21.0, 9.0, 7.0, 3.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-164.11663818359375, -159.47264099121094, -154.82864379882812, -150.1846466064453, -145.5406494140625, -140.8966522216797, -136.25265502929688, -131.60865783691406, -126.96466064453125, -122.32066345214844, -117.67666625976562, -113.03266906738281, -108.388671875, -103.74467468261719, -99.10067749023438, -94.45668029785156, -89.81268310546875, -85.16868591308594, -80.52468872070312, -75.88069152832031, -71.2366943359375, -66.59269714355469, -61.948699951171875, -57.30470275878906, -52.66070556640625, -48.01670837402344, -43.372711181640625, -38.72871398925781, -34.084716796875, -29.440719604492188, -24.796722412109375, -20.152725219726562, -15.508712768554688, -10.864715576171875, -6.2207183837890625, -1.57672119140625, 3.0672760009765625, 7.711273193359375, 12.355270385742188, 16.999267578125, 21.643264770507812, 26.287261962890625, 30.931259155273438, 35.57525634765625, 40.21925354003906, 44.863250732421875, 49.50724792480469, 54.1512451171875, 58.79524230957031, 63.439239501953125, 68.08323669433594, 72.72723388671875, 77.37123107910156, 82.01522827148438, 86.65922546386719, 91.30322265625, 95.94721984863281, 100.59121704101562, 105.23521423339844, 109.87921142578125, 114.52320861816406, 119.16720581054688, 123.81120300292969, 128.4552001953125, 133.0991973876953]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 6.0, 13.0, 17.0, 27.0, 34.0, 60.0, 115.0, 174.0, 340.0, 632.0, 1192.0, 2267.0, 5254.0, 14287.0, 59231.0, 3788373.0, 274520.0, 31187.0, 9184.0, 3709.0, 1658.0, 913.0, 506.0, 250.0, 128.0, 84.0, 33.0, 27.0, 30.0, 8.0, 11.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.5625, -52.89892578125, -51.2353515625, -49.57177734375, -47.908203125, -46.24462890625, -44.5810546875, -42.91748046875, -41.25390625, -39.59033203125, -37.9267578125, -36.26318359375, -34.599609375, -32.93603515625, -31.2724609375, -29.60888671875, -27.9453125, -26.28173828125, -24.6181640625, -22.95458984375, -21.291015625, -19.62744140625, -17.9638671875, -16.30029296875, -14.63671875, -12.97314453125, -11.3095703125, -9.64599609375, -7.982421875, -6.31884765625, -4.6552734375, -2.99169921875, -1.328125, 0.33544921875, 1.9990234375, 3.66259765625, 5.326171875, 6.98974609375, 8.6533203125, 10.31689453125, 11.98046875, 13.64404296875, 15.3076171875, 16.97119140625, 18.634765625, 20.29833984375, 21.9619140625, 23.62548828125, 25.2890625, 26.95263671875, 28.6162109375, 30.27978515625, 31.943359375, 33.60693359375, 35.2705078125, 36.93408203125, 38.59765625, 40.26123046875, 41.9248046875, 43.58837890625, 45.251953125, 46.91552734375, 48.5791015625, 50.24267578125, 51.90625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 5.0, 9.0, 9.0, 5.0, 18.0, 22.0, 20.0, 17.0, 30.0, 32.0, 44.0, 48.0, 45.0, 44.0, 39.0, 51.0, 48.0, 52.0, 51.0, 52.0, 37.0, 54.0, 35.0, 38.0, 34.0, 30.0, 28.0, 22.0, 18.0, 18.0, 11.0, 8.0, 7.0, 3.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.53515625, -6.29364013671875, -6.0521240234375, -5.81060791015625, -5.569091796875, -5.32757568359375, -5.0860595703125, -4.84454345703125, -4.60302734375, -4.36151123046875, -4.1199951171875, -3.87847900390625, -3.636962890625, -3.39544677734375, -3.1539306640625, -2.91241455078125, -2.6708984375, -2.42938232421875, -2.1878662109375, -1.94635009765625, -1.704833984375, -1.46331787109375, -1.2218017578125, -0.98028564453125, -0.73876953125, -0.49725341796875, -0.2557373046875, -0.01422119140625, 0.227294921875, 0.46881103515625, 0.7103271484375, 0.95184326171875, 1.193359375, 1.43487548828125, 1.6763916015625, 1.91790771484375, 2.159423828125, 2.40093994140625, 2.6424560546875, 2.88397216796875, 3.12548828125, 3.36700439453125, 3.6085205078125, 3.85003662109375, 4.091552734375, 4.33306884765625, 4.5745849609375, 4.81610107421875, 5.0576171875, 5.29913330078125, 5.5406494140625, 5.78216552734375, 6.023681640625, 6.26519775390625, 6.5067138671875, 6.74822998046875, 6.98974609375, 7.23126220703125, 7.4727783203125, 7.71429443359375, 7.955810546875, 8.19732666015625, 8.4388427734375, 8.68035888671875, 8.921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 12.0, 19.0, 21.0, 26.0, 33.0, 58.0, 71.0, 87.0, 144.0, 186.0, 279.0, 446.0, 636.0, 1069.0, 1707.0, 3228.0, 6819.0, 16721.0, 54748.0, 468319.0, 3496734.0, 98229.0, 25200.0, 9452.0, 4269.0, 2250.0, 1265.0, 753.0, 487.0, 332.0, 211.0, 136.0, 94.0, 60.0, 44.0, 38.0, 22.0, 22.0, 20.0, 10.0, 7.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.65625, -36.44873046875, -35.2412109375, -34.03369140625, -32.826171875, -31.61865234375, -30.4111328125, -29.20361328125, -27.99609375, -26.78857421875, -25.5810546875, -24.37353515625, -23.166015625, -21.95849609375, -20.7509765625, -19.54345703125, -18.3359375, -17.12841796875, -15.9208984375, -14.71337890625, -13.505859375, -12.29833984375, -11.0908203125, -9.88330078125, -8.67578125, -7.46826171875, -6.2607421875, -5.05322265625, -3.845703125, -2.63818359375, -1.4306640625, -0.22314453125, 0.984375, 2.19189453125, 3.3994140625, 4.60693359375, 5.814453125, 7.02197265625, 8.2294921875, 9.43701171875, 10.64453125, 11.85205078125, 13.0595703125, 14.26708984375, 15.474609375, 16.68212890625, 17.8896484375, 19.09716796875, 20.3046875, 21.51220703125, 22.7197265625, 23.92724609375, 25.134765625, 26.34228515625, 27.5498046875, 28.75732421875, 29.96484375, 31.17236328125, 32.3798828125, 33.58740234375, 34.794921875, 36.00244140625, 37.2099609375, 38.41748046875, 39.625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 10.0, 9.0, 13.0, 20.0, 31.0, 53.0, 83.0, 171.0, 598.0, 2431.0, 326.0, 125.0, 55.0, 40.0, 26.0, 21.0, 15.0, 7.0, 6.0, 8.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.71875, -22.092529296875, -21.46630859375, -20.840087890625, -20.2138671875, -19.587646484375, -18.96142578125, -18.335205078125, -17.708984375, -17.082763671875, -16.45654296875, -15.830322265625, -15.2041015625, -14.577880859375, -13.95166015625, -13.325439453125, -12.69921875, -12.072998046875, -11.44677734375, -10.820556640625, -10.1943359375, -9.568115234375, -8.94189453125, -8.315673828125, -7.689453125, -7.063232421875, -6.43701171875, -5.810791015625, -5.1845703125, -4.558349609375, -3.93212890625, -3.305908203125, -2.6796875, -2.053466796875, -1.42724609375, -0.801025390625, -0.1748046875, 0.451416015625, 1.07763671875, 1.703857421875, 2.330078125, 2.956298828125, 3.58251953125, 4.208740234375, 4.8349609375, 5.461181640625, 6.08740234375, 6.713623046875, 7.33984375, 7.966064453125, 8.59228515625, 9.218505859375, 9.8447265625, 10.470947265625, 11.09716796875, 11.723388671875, 12.349609375, 12.975830078125, 13.60205078125, 14.228271484375, 14.8544921875, 15.480712890625, 16.10693359375, 16.733154296875, 17.359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 16.0, 46.0, 92.0, 193.0, 266.0, 172.0, 96.0, 58.0, 23.0, 10.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-181.18637084960938, -175.74212646484375, -170.29788208007812, -164.85362243652344, -159.4093780517578, -153.9651336669922, -148.52088928222656, -143.07662963867188, -137.63238525390625, -132.18814086914062, -126.74388885498047, -121.29964447021484, -115.85539245605469, -110.41114807128906, -104.96690368652344, -99.52265167236328, -94.07840728759766, -88.63416290283203, -83.18991088867188, -77.74566650390625, -72.3014144897461, -66.85717010498047, -61.41292190551758, -55.96867370605469, -50.5244255065918, -45.080177307128906, -39.635929107666016, -34.191680908203125, -28.747434616088867, -23.303186416625977, -17.85894012451172, -12.414691925048828, -6.9704437255859375, -1.526196002960205, 3.9180517196655273, 9.362298965454102, 14.806547164916992, 20.250795364379883, 25.69504165649414, 31.13928985595703, 36.58353805541992, 42.02778625488281, 47.4720344543457, 52.916282653808594, 58.36052703857422, 63.804779052734375, 69.2490234375, 74.69326782226562, 80.13751983642578, 85.5817642211914, 91.02601623535156, 96.47026062011719, 101.91451263427734, 107.35875701904297, 112.80300903320312, 118.24725341796875, 123.69149780273438, 129.1357421875, 134.57998657226562, 140.0242462158203, 145.46849060058594, 150.91273498535156, 156.3569793701172, 161.80123901367188, 167.2454833984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 7.0, 9.0, 12.0, 18.0, 19.0, 23.0, 25.0, 31.0, 29.0, 36.0, 32.0, 57.0, 45.0, 31.0, 53.0, 50.0, 34.0, 55.0, 56.0, 38.0, 35.0, 40.0, 40.0, 44.0, 36.0, 34.0, 23.0, 11.0, 9.0, 14.0, 11.0, 12.0, 3.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.36979675292969, -56.436771392822266, -54.50374221801758, -52.570716857910156, -50.63768768310547, -48.70466232299805, -46.771636962890625, -44.83860778808594, -42.905582427978516, -40.972557067871094, -39.039527893066406, -37.106502532958984, -35.1734733581543, -33.240447998046875, -31.30742073059082, -29.374393463134766, -27.44136619567871, -25.508338928222656, -23.5753116607666, -21.642284393310547, -19.709259033203125, -17.77623176574707, -15.843204498291016, -13.910178184509277, -11.977150917053223, -10.044123649597168, -8.11109733581543, -6.178070068359375, -4.2450432777404785, -2.312016487121582, -0.37898921966552734, 1.554037094116211, 3.4870643615722656, 5.420091152191162, 7.353117942810059, 9.286145210266113, 11.219171524047852, 13.152198791503906, 15.085226058959961, 17.018253326416016, 18.951278686523438, 20.884305953979492, 22.817333221435547, 24.75035858154297, 26.683385848999023, 28.616413116455078, 30.549440383911133, 32.48246765136719, 34.415496826171875, 36.3485221862793, 38.281551361083984, 40.214576721191406, 42.147605895996094, 44.080631256103516, 46.01365661621094, 47.946685791015625, 49.87971115112305, 51.81273651123047, 53.745765686035156, 55.67879104614258, 57.611820220947266, 59.54484558105469, 61.477874755859375, 63.4109001159668, 65.34392547607422]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 7.0, 18.0, 20.0, 36.0, 46.0, 73.0, 120.0, 167.0, 316.0, 580.0, 881.0, 1854.0, 3773.0, 7991.0, 18284.0, 48397.0, 145541.0, 437750.0, 254842.0, 77572.0, 27906.0, 11616.0, 5200.0, 2600.0, 1222.0, 694.0, 406.0, 233.0, 161.0, 98.0, 60.0, 23.0, 26.0, 11.0, 11.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.53125, -32.43994140625, -31.3486328125, -30.25732421875, -29.166015625, -28.07470703125, -26.9833984375, -25.89208984375, -24.80078125, -23.70947265625, -22.6181640625, -21.52685546875, -20.435546875, -19.34423828125, -18.2529296875, -17.16162109375, -16.0703125, -14.97900390625, -13.8876953125, -12.79638671875, -11.705078125, -10.61376953125, -9.5224609375, -8.43115234375, -7.33984375, -6.24853515625, -5.1572265625, -4.06591796875, -2.974609375, -1.88330078125, -0.7919921875, 0.29931640625, 1.390625, 2.48193359375, 3.5732421875, 4.66455078125, 5.755859375, 6.84716796875, 7.9384765625, 9.02978515625, 10.12109375, 11.21240234375, 12.3037109375, 13.39501953125, 14.486328125, 15.57763671875, 16.6689453125, 17.76025390625, 18.8515625, 19.94287109375, 21.0341796875, 22.12548828125, 23.216796875, 24.30810546875, 25.3994140625, 26.49072265625, 27.58203125, 28.67333984375, 29.7646484375, 30.85595703125, 31.947265625, 33.03857421875, 34.1298828125, 35.22119140625, 36.3125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 13.0, 7.0, 9.0, 19.0, 16.0, 22.0, 23.0, 21.0, 31.0, 31.0, 31.0, 38.0, 40.0, 42.0, 40.0, 55.0, 40.0, 43.0, 47.0, 55.0, 52.0, 54.0, 19.0, 39.0, 28.0, 34.0, 26.0, 23.0, 18.0, 11.0, 19.0, 14.0, 8.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.6640625, -6.4271240234375, -6.190185546875, -5.9532470703125, -5.71630859375, -5.4793701171875, -5.242431640625, -5.0054931640625, -4.7685546875, -4.5316162109375, -4.294677734375, -4.0577392578125, -3.82080078125, -3.5838623046875, -3.346923828125, -3.1099853515625, -2.873046875, -2.6361083984375, -2.399169921875, -2.1622314453125, -1.92529296875, -1.6883544921875, -1.451416015625, -1.2144775390625, -0.9775390625, -0.7406005859375, -0.503662109375, -0.2667236328125, -0.02978515625, 0.2071533203125, 0.444091796875, 0.6810302734375, 0.91796875, 1.1549072265625, 1.391845703125, 1.6287841796875, 1.86572265625, 2.1026611328125, 2.339599609375, 2.5765380859375, 2.8134765625, 3.0504150390625, 3.287353515625, 3.5242919921875, 3.76123046875, 3.9981689453125, 4.235107421875, 4.4720458984375, 4.708984375, 4.9459228515625, 5.182861328125, 5.4197998046875, 5.65673828125, 5.8936767578125, 6.130615234375, 6.3675537109375, 6.6044921875, 6.8414306640625, 7.078369140625, 7.3153076171875, 7.55224609375, 7.7891845703125, 8.026123046875, 8.2630615234375, 8.5]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 10.0, 11.0, 21.0, 25.0, 38.0, 33.0, 55.0, 96.0, 161.0, 281.0, 552.0, 1066.0, 2681.0, 7425.0, 24988.0, 106390.0, 571189.0, 261398.0, 50500.0, 13576.0, 4486.0, 1755.0, 808.0, 424.0, 199.0, 131.0, 78.0, 56.0, 34.0, 17.0, 12.0, 14.0, 10.0, 8.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.96875, -38.4169921875, -36.865234375, -35.3134765625, -33.76171875, -32.2099609375, -30.658203125, -29.1064453125, -27.5546875, -26.0029296875, -24.451171875, -22.8994140625, -21.34765625, -19.7958984375, -18.244140625, -16.6923828125, -15.140625, -13.5888671875, -12.037109375, -10.4853515625, -8.93359375, -7.3818359375, -5.830078125, -4.2783203125, -2.7265625, -1.1748046875, 0.376953125, 1.9287109375, 3.48046875, 5.0322265625, 6.583984375, 8.1357421875, 9.6875, 11.2392578125, 12.791015625, 14.3427734375, 15.89453125, 17.4462890625, 18.998046875, 20.5498046875, 22.1015625, 23.6533203125, 25.205078125, 26.7568359375, 28.30859375, 29.8603515625, 31.412109375, 32.9638671875, 34.515625, 36.0673828125, 37.619140625, 39.1708984375, 40.72265625, 42.2744140625, 43.826171875, 45.3779296875, 46.9296875, 48.4814453125, 50.033203125, 51.5849609375, 53.13671875, 54.6884765625, 56.240234375, 57.7919921875, 59.34375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 9.0, 12.0, 7.0, 12.0, 20.0, 21.0, 27.0, 24.0, 29.0, 38.0, 29.0, 39.0, 39.0, 38.0, 48.0, 56.0, 48.0, 68.0, 41.0, 42.0, 45.0, 36.0, 26.0, 28.0, 29.0, 34.0, 23.0, 24.0, 14.0, 11.0, 18.0, 13.0, 3.0, 7.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.5576171875, -30.521484375, -29.4853515625, -28.44921875, -27.4130859375, -26.376953125, -25.3408203125, -24.3046875, -23.2685546875, -22.232421875, -21.1962890625, -20.16015625, -19.1240234375, -18.087890625, -17.0517578125, -16.015625, -14.9794921875, -13.943359375, -12.9072265625, -11.87109375, -10.8349609375, -9.798828125, -8.7626953125, -7.7265625, -6.6904296875, -5.654296875, -4.6181640625, -3.58203125, -2.5458984375, -1.509765625, -0.4736328125, 0.5625, 1.5986328125, 2.634765625, 3.6708984375, 4.70703125, 5.7431640625, 6.779296875, 7.8154296875, 8.8515625, 9.8876953125, 10.923828125, 11.9599609375, 12.99609375, 14.0322265625, 15.068359375, 16.1044921875, 17.140625, 18.1767578125, 19.212890625, 20.2490234375, 21.28515625, 22.3212890625, 23.357421875, 24.3935546875, 25.4296875, 26.4658203125, 27.501953125, 28.5380859375, 29.57421875, 30.6103515625, 31.646484375, 32.6826171875, 33.71875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 9.0, 8.0, 16.0, 15.0, 33.0, 39.0, 78.0, 116.0, 224.0, 347.0, 638.0, 1143.0, 2547.0, 6981.0, 24452.0, 141440.0, 688743.0, 144047.0, 24945.0, 7301.0, 2686.0, 1229.0, 640.0, 354.0, 203.0, 96.0, 63.0, 47.0, 27.0, 22.0, 15.0, 8.0, 6.0, 5.0, 4.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-22.359375, -21.7786865234375, -21.197998046875, -20.6173095703125, -20.03662109375, -19.4559326171875, -18.875244140625, -18.2945556640625, -17.7138671875, -17.1331787109375, -16.552490234375, -15.9718017578125, -15.39111328125, -14.8104248046875, -14.229736328125, -13.6490478515625, -13.068359375, -12.4876708984375, -11.906982421875, -11.3262939453125, -10.74560546875, -10.1649169921875, -9.584228515625, -9.0035400390625, -8.4228515625, -7.8421630859375, -7.261474609375, -6.6807861328125, -6.10009765625, -5.5194091796875, -4.938720703125, -4.3580322265625, -3.77734375, -3.1966552734375, -2.615966796875, -2.0352783203125, -1.45458984375, -0.8739013671875, -0.293212890625, 0.2874755859375, 0.8681640625, 1.4488525390625, 2.029541015625, 2.6102294921875, 3.19091796875, 3.7716064453125, 4.352294921875, 4.9329833984375, 5.513671875, 6.0943603515625, 6.675048828125, 7.2557373046875, 7.83642578125, 8.4171142578125, 8.997802734375, 9.5784912109375, 10.1591796875, 10.7398681640625, 11.320556640625, 11.9012451171875, 12.48193359375, 13.0626220703125, 13.643310546875, 14.2239990234375, 14.8046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 7.0, 5.0, 9.0, 9.0, 17.0, 11.0, 27.0, 34.0, 43.0, 78.0, 121.0, 165.0, 139.0, 102.0, 72.0, 38.0, 28.0, 20.0, 11.0, 9.0, 11.0, 6.0, 10.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003124237060546875, -0.00302886962890625, -0.002933502197265625, -0.002838134765625, -0.002742767333984375, -0.00264739990234375, -0.002552032470703125, -0.0024566650390625, -0.002361297607421875, -0.00226593017578125, -0.002170562744140625, -0.0020751953125, -0.001979827880859375, -0.00188446044921875, -0.001789093017578125, -0.0016937255859375, -0.001598358154296875, -0.00150299072265625, -0.001407623291015625, -0.001312255859375, -0.001216888427734375, -0.00112152099609375, -0.001026153564453125, -0.0009307861328125, -0.000835418701171875, -0.00074005126953125, -0.000644683837890625, -0.00054931640625, -0.000453948974609375, -0.00035858154296875, -0.000263214111328125, -0.0001678466796875, -7.2479248046875e-05, 2.288818359375e-05, 0.000118255615234375, 0.000213623046875, 0.000308990478515625, 0.00040435791015625, 0.000499725341796875, 0.0005950927734375, 0.000690460205078125, 0.00078582763671875, 0.000881195068359375, 0.0009765625, 0.001071929931640625, 0.00116729736328125, 0.001262664794921875, 0.0013580322265625, 0.001453399658203125, 0.00154876708984375, 0.001644134521484375, 0.001739501953125, 0.001834869384765625, 0.00193023681640625, 0.002025604248046875, 0.0021209716796875, 0.002216339111328125, 0.00231170654296875, 0.002407073974609375, 0.00250244140625, 0.002597808837890625, 0.00269317626953125, 0.002788543701171875, 0.0028839111328125, 0.002979278564453125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 6.0, 7.0, 7.0, 21.0, 29.0, 39.0, 57.0, 84.0, 131.0, 206.0, 361.0, 612.0, 1305.0, 2908.0, 8774.0, 40566.0, 399079.0, 527342.0, 50458.0, 10300.0, 3266.0, 1373.0, 655.0, 349.0, 221.0, 132.0, 89.0, 51.0, 33.0, 25.0, 12.0, 16.0, 11.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.421875, -15.81494140625, -15.2080078125, -14.60107421875, -13.994140625, -13.38720703125, -12.7802734375, -12.17333984375, -11.56640625, -10.95947265625, -10.3525390625, -9.74560546875, -9.138671875, -8.53173828125, -7.9248046875, -7.31787109375, -6.7109375, -6.10400390625, -5.4970703125, -4.89013671875, -4.283203125, -3.67626953125, -3.0693359375, -2.46240234375, -1.85546875, -1.24853515625, -0.6416015625, -0.03466796875, 0.572265625, 1.17919921875, 1.7861328125, 2.39306640625, 3.0, 3.60693359375, 4.2138671875, 4.82080078125, 5.427734375, 6.03466796875, 6.6416015625, 7.24853515625, 7.85546875, 8.46240234375, 9.0693359375, 9.67626953125, 10.283203125, 10.89013671875, 11.4970703125, 12.10400390625, 12.7109375, 13.31787109375, 13.9248046875, 14.53173828125, 15.138671875, 15.74560546875, 16.3525390625, 16.95947265625, 17.56640625, 18.17333984375, 18.7802734375, 19.38720703125, 19.994140625, 20.60107421875, 21.2080078125, 21.81494140625, 22.421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 10.0, 10.0, 11.0, 19.0, 21.0, 30.0, 37.0, 37.0, 48.0, 83.0, 90.0, 94.0, 86.0, 88.0, 75.0, 53.0, 52.0, 29.0, 20.0, 13.0, 12.0, 18.0, 11.0, 6.0, 11.0, 4.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.0, -12.5496826171875, -12.099365234375, -11.6490478515625, -11.19873046875, -10.7484130859375, -10.298095703125, -9.8477783203125, -9.3974609375, -8.9471435546875, -8.496826171875, -8.0465087890625, -7.59619140625, -7.1458740234375, -6.695556640625, -6.2452392578125, -5.794921875, -5.3446044921875, -4.894287109375, -4.4439697265625, -3.99365234375, -3.5433349609375, -3.093017578125, -2.6427001953125, -2.1923828125, -1.7420654296875, -1.291748046875, -0.8414306640625, -0.39111328125, 0.0592041015625, 0.509521484375, 0.9598388671875, 1.41015625, 1.8604736328125, 2.310791015625, 2.7611083984375, 3.21142578125, 3.6617431640625, 4.112060546875, 4.5623779296875, 5.0126953125, 5.4630126953125, 5.913330078125, 6.3636474609375, 6.81396484375, 7.2642822265625, 7.714599609375, 8.1649169921875, 8.615234375, 9.0655517578125, 9.515869140625, 9.9661865234375, 10.41650390625, 10.8668212890625, 11.317138671875, 11.7674560546875, 12.2177734375, 12.6680908203125, 13.118408203125, 13.5687255859375, 14.01904296875, 14.4693603515625, 14.919677734375, 15.3699951171875, 15.8203125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 12.0, 60.0, 319.0, 423.0, 140.0, 41.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1461.43603515625, -1431.745849609375, -1402.0555419921875, -1372.3653564453125, -1342.6751708984375, -1312.9849853515625, -1283.294677734375, -1253.6044921875, -1223.914306640625, -1194.22412109375, -1164.5338134765625, -1134.8436279296875, -1105.1534423828125, -1075.4632568359375, -1045.77294921875, -1016.082763671875, -986.3925170898438, -956.7022705078125, -927.0120849609375, -897.3218383789062, -867.6316528320312, -837.94140625, -808.251220703125, -778.5609741210938, -748.8707275390625, -719.1804809570312, -689.4902954101562, -659.800048828125, -630.10986328125, -600.4196166992188, -570.7293701171875, -541.0391845703125, -511.34906005859375, -481.6588439941406, -451.9686279296875, -422.27838134765625, -392.58819580078125, -362.89794921875, -333.2077331542969, -303.51751708984375, -273.8273010253906, -244.1370849609375, -214.44686889648438, -184.7566375732422, -155.06642150878906, -125.37620544433594, -95.68597412109375, -65.99575805664062, -36.3055419921875, -6.615322113037109, 23.07489776611328, 52.76512145996094, 82.45533752441406, 112.14555358886719, 141.83578491210938, 171.5260009765625, 201.21621704101562, 230.90643310546875, 260.5966491699219, 290.286865234375, 319.97711181640625, 349.66729736328125, 379.3575439453125, 409.0477600097656, 438.73797607421875]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 4.0, 8.0, 6.0, 8.0, 8.0, 8.0, 6.0, 10.0, 8.0, 27.0, 22.0, 28.0, 25.0, 25.0, 21.0, 16.0, 35.0, 30.0, 36.0, 41.0, 36.0, 35.0, 39.0, 39.0, 35.0, 37.0, 28.0, 37.0, 32.0, 39.0, 32.0, 26.0, 20.0, 25.0, 27.0, 21.0, 18.0, 15.0, 9.0, 13.0, 14.0, 10.0, 5.0, 4.0, 11.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0], "bins": [-142.39508056640625, -138.1282196044922, -133.86134338378906, -129.594482421875, -125.3276138305664, -121.06074523925781, -116.79388427734375, -112.52701568603516, -108.26014709472656, -103.99327850341797, -99.7264175415039, -95.45954895019531, -91.19268035888672, -86.92581176757812, -82.65895080566406, -78.39208221435547, -74.1252212524414, -69.85835266113281, -65.59149169921875, -61.324623107910156, -57.05775451660156, -52.790889739990234, -48.524024963378906, -44.25715637207031, -39.990291595458984, -35.723426818847656, -31.456558227539062, -27.189693450927734, -22.922826766967773, -18.655960083007812, -14.389095306396484, -10.122228622436523, -5.8553619384765625, -1.5884957313537598, 2.678370475769043, 6.9452362060546875, 11.212102890014648, 15.47896957397461, 19.745834350585938, 24.0127010345459, 28.27956771850586, 32.54643249511719, 36.81330108642578, 41.08016586303711, 45.34703063964844, 49.61389923095703, 53.88076400756836, 58.14762878417969, 62.41449737548828, 66.68136596679688, 70.94822692871094, 75.21509552001953, 79.48196411132812, 83.74882507324219, 88.01569366455078, 92.28256225585938, 96.54942321777344, 100.81629180908203, 105.0831527709961, 109.35002136230469, 113.61688995361328, 117.88375854492188, 122.15061950683594, 126.41748809814453, 130.68435668945312]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 5.0, 4.0, 9.0, 16.0, 13.0, 27.0, 27.0, 42.0, 45.0, 91.0, 154.0, 211.0, 357.0, 661.0, 1048.0, 1831.0, 3352.0, 7045.0, 16516.0, 53239.0, 3343265.0, 690184.0, 46944.0, 14779.0, 6658.0, 3425.0, 1793.0, 1048.0, 573.0, 316.0, 200.0, 127.0, 81.0, 57.0, 34.0, 33.0, 14.0, 10.0, 17.0, 8.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.9375, -42.3076171875, -40.677734375, -39.0478515625, -37.41796875, -35.7880859375, -34.158203125, -32.5283203125, -30.8984375, -29.2685546875, -27.638671875, -26.0087890625, -24.37890625, -22.7490234375, -21.119140625, -19.4892578125, -17.859375, -16.2294921875, -14.599609375, -12.9697265625, -11.33984375, -9.7099609375, -8.080078125, -6.4501953125, -4.8203125, -3.1904296875, -1.560546875, 0.0693359375, 1.69921875, 3.3291015625, 4.958984375, 6.5888671875, 8.21875, 9.8486328125, 11.478515625, 13.1083984375, 14.73828125, 16.3681640625, 17.998046875, 19.6279296875, 21.2578125, 22.8876953125, 24.517578125, 26.1474609375, 27.77734375, 29.4072265625, 31.037109375, 32.6669921875, 34.296875, 35.9267578125, 37.556640625, 39.1865234375, 40.81640625, 42.4462890625, 44.076171875, 45.7060546875, 47.3359375, 48.9658203125, 50.595703125, 52.2255859375, 53.85546875, 55.4853515625, 57.115234375, 58.7451171875, 60.375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 5.0, 12.0, 13.0, 7.0, 16.0, 15.0, 28.0, 22.0, 34.0, 32.0, 33.0, 30.0, 42.0, 41.0, 38.0, 44.0, 40.0, 48.0, 51.0, 44.0, 51.0, 41.0, 29.0, 28.0, 26.0, 29.0, 32.0, 18.0, 17.0, 32.0, 14.0, 14.0, 10.0, 5.0, 5.0, 10.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.625, -6.383056640625, -6.14111328125, -5.899169921875, -5.6572265625, -5.415283203125, -5.17333984375, -4.931396484375, -4.689453125, -4.447509765625, -4.20556640625, -3.963623046875, -3.7216796875, -3.479736328125, -3.23779296875, -2.995849609375, -2.75390625, -2.511962890625, -2.27001953125, -2.028076171875, -1.7861328125, -1.544189453125, -1.30224609375, -1.060302734375, -0.818359375, -0.576416015625, -0.33447265625, -0.092529296875, 0.1494140625, 0.391357421875, 0.63330078125, 0.875244140625, 1.1171875, 1.359130859375, 1.60107421875, 1.843017578125, 2.0849609375, 2.326904296875, 2.56884765625, 2.810791015625, 3.052734375, 3.294677734375, 3.53662109375, 3.778564453125, 4.0205078125, 4.262451171875, 4.50439453125, 4.746337890625, 4.98828125, 5.230224609375, 5.47216796875, 5.714111328125, 5.9560546875, 6.197998046875, 6.43994140625, 6.681884765625, 6.923828125, 7.165771484375, 7.40771484375, 7.649658203125, 7.8916015625, 8.133544921875, 8.37548828125, 8.617431640625, 8.859375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 10.0, 15.0, 25.0, 30.0, 59.0, 50.0, 115.0, 134.0, 210.0, 318.0, 457.0, 715.0, 1019.0, 1581.0, 2536.0, 4225.0, 7015.0, 12793.0, 25868.0, 61239.0, 222752.0, 3496818.0, 235190.0, 63124.0, 26360.0, 13047.0, 7105.0, 4141.0, 2579.0, 1615.0, 1014.0, 670.0, 465.0, 304.0, 204.0, 122.0, 103.0, 77.0, 60.0, 26.0, 28.0, 11.0, 12.0, 11.0, 10.0, 3.0, 2.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.671875, -24.802001953125, -23.93212890625, -23.062255859375, -22.1923828125, -21.322509765625, -20.45263671875, -19.582763671875, -18.712890625, -17.843017578125, -16.97314453125, -16.103271484375, -15.2333984375, -14.363525390625, -13.49365234375, -12.623779296875, -11.75390625, -10.884033203125, -10.01416015625, -9.144287109375, -8.2744140625, -7.404541015625, -6.53466796875, -5.664794921875, -4.794921875, -3.925048828125, -3.05517578125, -2.185302734375, -1.3154296875, -0.445556640625, 0.42431640625, 1.294189453125, 2.1640625, 3.033935546875, 3.90380859375, 4.773681640625, 5.6435546875, 6.513427734375, 7.38330078125, 8.253173828125, 9.123046875, 9.992919921875, 10.86279296875, 11.732666015625, 12.6025390625, 13.472412109375, 14.34228515625, 15.212158203125, 16.08203125, 16.951904296875, 17.82177734375, 18.691650390625, 19.5615234375, 20.431396484375, 21.30126953125, 22.171142578125, 23.041015625, 23.910888671875, 24.78076171875, 25.650634765625, 26.5205078125, 27.390380859375, 28.26025390625, 29.130126953125, 30.0]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 7.0, 5.0, 7.0, 6.0, 12.0, 16.0, 17.0, 21.0, 30.0, 37.0, 61.0, 97.0, 218.0, 1169.0, 1766.0, 205.0, 102.0, 69.0, 51.0, 37.0, 29.0, 19.0, 14.0, 14.0, 6.0, 10.0, 8.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.953125, -16.482421875, -16.01171875, -15.541015625, -15.0703125, -14.599609375, -14.12890625, -13.658203125, -13.1875, -12.716796875, -12.24609375, -11.775390625, -11.3046875, -10.833984375, -10.36328125, -9.892578125, -9.421875, -8.951171875, -8.48046875, -8.009765625, -7.5390625, -7.068359375, -6.59765625, -6.126953125, -5.65625, -5.185546875, -4.71484375, -4.244140625, -3.7734375, -3.302734375, -2.83203125, -2.361328125, -1.890625, -1.419921875, -0.94921875, -0.478515625, -0.0078125, 0.462890625, 0.93359375, 1.404296875, 1.875, 2.345703125, 2.81640625, 3.287109375, 3.7578125, 4.228515625, 4.69921875, 5.169921875, 5.640625, 6.111328125, 6.58203125, 7.052734375, 7.5234375, 7.994140625, 8.46484375, 8.935546875, 9.40625, 9.876953125, 10.34765625, 10.818359375, 11.2890625, 11.759765625, 12.23046875, 12.701171875, 13.171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 11.0, 63.0, 423.0, 412.0, 76.0, 15.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-413.303955078125, -399.91461181640625, -386.5252380371094, -373.1358947753906, -359.74652099609375, -346.357177734375, -332.96783447265625, -319.5784912109375, -306.1891174316406, -292.7997741699219, -279.410400390625, -266.02105712890625, -252.63169860839844, -239.24234008789062, -225.85299682617188, -212.46363830566406, -199.07427978515625, -185.68492126464844, -172.29556274414062, -158.90621948242188, -145.51686096191406, -132.12750244140625, -118.73815155029297, -105.34880065917969, -91.95944213867188, -78.57008361816406, -65.18073272705078, -51.791378021240234, -38.40202331542969, -25.012664794921875, -11.623313903808594, 1.7660369873046875, 15.155364990234375, 28.544719696044922, 41.93407440185547, 55.323429107666016, 68.71278381347656, 82.10214233398438, 95.49149322509766, 108.88084411621094, 122.27020263671875, 135.65956115722656, 149.04891967773438, 162.43826293945312, 175.82762145996094, 189.21697998046875, 202.6063232421875, 215.9956817626953, 229.38504028320312, 242.77439880371094, 256.16375732421875, 269.5531005859375, 282.94244384765625, 296.3318176269531, 309.7211608886719, 323.11053466796875, 336.4998779296875, 349.88922119140625, 363.2785949707031, 376.6679382324219, 390.05731201171875, 403.4466552734375, 416.83599853515625, 430.225341796875, 443.6147155761719]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 5.0, 4.0, 7.0, 23.0, 26.0, 24.0, 33.0, 38.0, 42.0, 46.0, 44.0, 73.0, 63.0, 51.0, 45.0, 53.0, 62.0, 50.0, 64.0, 50.0, 34.0, 39.0, 21.0, 28.0, 14.0, 21.0, 7.0, 12.0, 2.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0], "bins": [-99.22796630859375, -96.93639373779297, -94.64482116699219, -92.35325622558594, -90.06168365478516, -87.77011108398438, -85.47854614257812, -83.18697357177734, -80.89540100097656, -78.60382843017578, -76.312255859375, -74.02069091796875, -71.72911834716797, -69.43754577636719, -67.14598083496094, -64.85440826416016, -62.562835693359375, -60.271263122558594, -57.97969436645508, -55.68812561035156, -53.39655303955078, -51.10498046875, -48.813411712646484, -46.52184295654297, -44.23027038574219, -41.938697814941406, -39.64712905883789, -37.355560302734375, -35.063987731933594, -32.77241516113281, -30.480846405029297, -28.18927574157715, -25.89771270751953, -23.606142044067383, -21.314571380615234, -19.023000717163086, -16.731430053710938, -14.439859390258789, -12.14828872680664, -9.856718063354492, -7.565147399902344, -5.273576736450195, -2.982006072998047, -0.6904354095458984, 1.60113525390625, 3.8927059173583984, 6.184276580810547, 8.475847244262695, 10.767417907714844, 13.058988571166992, 15.35055923461914, 17.64212989807129, 19.933700561523438, 22.225271224975586, 24.516841888427734, 26.808412551879883, 29.09998321533203, 31.39155387878418, 33.68312454223633, 35.974693298339844, 38.266265869140625, 40.557838439941406, 42.84940719604492, 45.14097595214844, 47.43254852294922]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 8.0, 9.0, 12.0, 16.0, 25.0, 29.0, 54.0, 94.0, 94.0, 153.0, 243.0, 366.0, 570.0, 839.0, 1338.0, 1994.0, 3194.0, 5418.0, 9289.0, 16436.0, 30483.0, 60585.0, 130843.0, 297369.0, 260604.0, 112617.0, 52913.0, 26895.0, 14462.0, 8349.0, 4964.0, 2949.0, 1825.0, 1192.0, 764.0, 502.0, 351.0, 230.0, 173.0, 86.0, 72.0, 41.0, 37.0, 19.0, 13.0, 5.0, 7.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-29.109375, -28.135986328125, -27.16259765625, -26.189208984375, -25.2158203125, -24.242431640625, -23.26904296875, -22.295654296875, -21.322265625, -20.348876953125, -19.37548828125, -18.402099609375, -17.4287109375, -16.455322265625, -15.48193359375, -14.508544921875, -13.53515625, -12.561767578125, -11.58837890625, -10.614990234375, -9.6416015625, -8.668212890625, -7.69482421875, -6.721435546875, -5.748046875, -4.774658203125, -3.80126953125, -2.827880859375, -1.8544921875, -0.881103515625, 0.09228515625, 1.065673828125, 2.0390625, 3.012451171875, 3.98583984375, 4.959228515625, 5.9326171875, 6.906005859375, 7.87939453125, 8.852783203125, 9.826171875, 10.799560546875, 11.77294921875, 12.746337890625, 13.7197265625, 14.693115234375, 15.66650390625, 16.639892578125, 17.61328125, 18.586669921875, 19.56005859375, 20.533447265625, 21.5068359375, 22.480224609375, 23.45361328125, 24.427001953125, 25.400390625, 26.373779296875, 27.34716796875, 28.320556640625, 29.2939453125, 30.267333984375, 31.24072265625, 32.214111328125, 33.1875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 8.0, 7.0, 4.0, 9.0, 13.0, 10.0, 18.0, 20.0, 29.0, 28.0, 25.0, 34.0, 30.0, 58.0, 48.0, 56.0, 51.0, 50.0, 61.0, 52.0, 47.0, 40.0, 35.0, 38.0, 42.0, 44.0, 24.0, 24.0, 16.0, 20.0, 17.0, 12.0, 8.0, 6.0, 12.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.6328125, -9.3331298828125, -9.033447265625, -8.7337646484375, -8.43408203125, -8.1343994140625, -7.834716796875, -7.5350341796875, -7.2353515625, -6.9356689453125, -6.635986328125, -6.3363037109375, -6.03662109375, -5.7369384765625, -5.437255859375, -5.1375732421875, -4.837890625, -4.5382080078125, -4.238525390625, -3.9388427734375, -3.63916015625, -3.3394775390625, -3.039794921875, -2.7401123046875, -2.4404296875, -2.1407470703125, -1.841064453125, -1.5413818359375, -1.24169921875, -0.9420166015625, -0.642333984375, -0.3426513671875, -0.04296875, 0.2567138671875, 0.556396484375, 0.8560791015625, 1.15576171875, 1.4554443359375, 1.755126953125, 2.0548095703125, 2.3544921875, 2.6541748046875, 2.953857421875, 3.2535400390625, 3.55322265625, 3.8529052734375, 4.152587890625, 4.4522705078125, 4.751953125, 5.0516357421875, 5.351318359375, 5.6510009765625, 5.95068359375, 6.2503662109375, 6.550048828125, 6.8497314453125, 7.1494140625, 7.4490966796875, 7.748779296875, 8.0484619140625, 8.34814453125, 8.6478271484375, 8.947509765625, 9.2471923828125, 9.546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 10.0, 3.0, 7.0, 22.0, 20.0, 57.0, 77.0, 95.0, 199.0, 501.0, 1340.0, 5678.0, 51115.0, 839391.0, 136237.0, 10569.0, 1954.0, 640.0, 280.0, 139.0, 74.0, 56.0, 34.0, 21.0, 9.0, 4.0, 2.0, 3.0, 7.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.25, -121.02734375, -116.8046875, -112.58203125, -108.359375, -104.13671875, -99.9140625, -95.69140625, -91.46875, -87.24609375, -83.0234375, -78.80078125, -74.578125, -70.35546875, -66.1328125, -61.91015625, -57.6875, -53.46484375, -49.2421875, -45.01953125, -40.796875, -36.57421875, -32.3515625, -28.12890625, -23.90625, -19.68359375, -15.4609375, -11.23828125, -7.015625, -2.79296875, 1.4296875, 5.65234375, 9.875, 14.09765625, 18.3203125, 22.54296875, 26.765625, 30.98828125, 35.2109375, 39.43359375, 43.65625, 47.87890625, 52.1015625, 56.32421875, 60.546875, 64.76953125, 68.9921875, 73.21484375, 77.4375, 81.66015625, 85.8828125, 90.10546875, 94.328125, 98.55078125, 102.7734375, 106.99609375, 111.21875, 115.44140625, 119.6640625, 123.88671875, 128.109375, 132.33203125, 136.5546875, 140.77734375, 145.0]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 9.0, 7.0, 6.0, 19.0, 33.0, 41.0, 49.0, 40.0, 70.0, 68.0, 90.0, 85.0, 77.0, 83.0, 63.0, 43.0, 52.0, 47.0, 26.0, 29.0, 17.0, 15.0, 8.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.4375, -63.234375, -61.03125, -58.828125, -56.625, -54.421875, -52.21875, -50.015625, -47.8125, -45.609375, -43.40625, -41.203125, -39.0, -36.796875, -34.59375, -32.390625, -30.1875, -27.984375, -25.78125, -23.578125, -21.375, -19.171875, -16.96875, -14.765625, -12.5625, -10.359375, -8.15625, -5.953125, -3.75, -1.546875, 0.65625, 2.859375, 5.0625, 7.265625, 9.46875, 11.671875, 13.875, 16.078125, 18.28125, 20.484375, 22.6875, 24.890625, 27.09375, 29.296875, 31.5, 33.703125, 35.90625, 38.109375, 40.3125, 42.515625, 44.71875, 46.921875, 49.125, 51.328125, 53.53125, 55.734375, 57.9375, 60.140625, 62.34375, 64.546875, 66.75, 68.953125, 71.15625, 73.359375, 75.5625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 5.0, 4.0, 7.0, 9.0, 18.0, 26.0, 47.0, 64.0, 99.0, 173.0, 340.0, 738.0, 1831.0, 6184.0, 31308.0, 483162.0, 483684.0, 31210.0, 6172.0, 1874.0, 821.0, 323.0, 195.0, 117.0, 45.0, 36.0, 18.0, 14.0, 10.0, 4.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.0625, -50.53125, -49.0, -47.46875, -45.9375, -44.40625, -42.875, -41.34375, -39.8125, -38.28125, -36.75, -35.21875, -33.6875, -32.15625, -30.625, -29.09375, -27.5625, -26.03125, -24.5, -22.96875, -21.4375, -19.90625, -18.375, -16.84375, -15.3125, -13.78125, -12.25, -10.71875, -9.1875, -7.65625, -6.125, -4.59375, -3.0625, -1.53125, 0.0, 1.53125, 3.0625, 4.59375, 6.125, 7.65625, 9.1875, 10.71875, 12.25, 13.78125, 15.3125, 16.84375, 18.375, 19.90625, 21.4375, 22.96875, 24.5, 26.03125, 27.5625, 29.09375, 30.625, 32.15625, 33.6875, 35.21875, 36.75, 38.28125, 39.8125, 41.34375, 42.875, 44.40625, 45.9375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 13.0, 16.0, 36.0, 52.0, 76.0, 126.0, 256.0, 166.0, 94.0, 71.0, 34.0, 17.0, 7.0, 12.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0079498291015625, -0.007719993591308594, -0.0074901580810546875, -0.007260322570800781, -0.007030487060546875, -0.006800651550292969, -0.0065708160400390625, -0.006340980529785156, -0.00611114501953125, -0.005881309509277344, -0.0056514739990234375, -0.005421638488769531, -0.005191802978515625, -0.004961967468261719, -0.0047321319580078125, -0.004502296447753906, -0.0042724609375, -0.004042625427246094, -0.0038127899169921875, -0.0035829544067382812, -0.003353118896484375, -0.0031232833862304688, -0.0028934478759765625, -0.0026636123657226562, -0.00243377685546875, -0.0022039413452148438, -0.0019741058349609375, -0.0017442703247070312, -0.001514434814453125, -0.0012845993041992188, -0.0010547637939453125, -0.0008249282836914062, -0.0005950927734375, -0.00036525726318359375, -0.0001354217529296875, 9.441375732421875e-05, 0.000324249267578125, 0.0005540847778320312, 0.0007839202880859375, 0.0010137557983398438, 0.00124359130859375, 0.0014734268188476562, 0.0017032623291015625, 0.0019330978393554688, 0.002162933349609375, 0.0023927688598632812, 0.0026226043701171875, 0.0028524398803710938, 0.003082275390625, 0.0033121109008789062, 0.0035419464111328125, 0.0037717819213867188, 0.004001617431640625, 0.004231452941894531, 0.0044612884521484375, 0.004691123962402344, 0.00492095947265625, 0.005150794982910156, 0.0053806304931640625, 0.005610466003417969, 0.005840301513671875, 0.006070137023925781, 0.0062999725341796875, 0.006529808044433594, 0.0067596435546875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 5.0, 17.0, 25.0, 35.0, 54.0, 88.0, 173.0, 342.0, 827.0, 3347.0, 32361.0, 896694.0, 106188.0, 6182.0, 1226.0, 467.0, 218.0, 121.0, 67.0, 34.0, 29.0, 20.0, 5.0, 7.0, 3.0, 6.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-82.25, -80.1767578125, -78.103515625, -76.0302734375, -73.95703125, -71.8837890625, -69.810546875, -67.7373046875, -65.6640625, -63.5908203125, -61.517578125, -59.4443359375, -57.37109375, -55.2978515625, -53.224609375, -51.1513671875, -49.078125, -47.0048828125, -44.931640625, -42.8583984375, -40.78515625, -38.7119140625, -36.638671875, -34.5654296875, -32.4921875, -30.4189453125, -28.345703125, -26.2724609375, -24.19921875, -22.1259765625, -20.052734375, -17.9794921875, -15.90625, -13.8330078125, -11.759765625, -9.6865234375, -7.61328125, -5.5400390625, -3.466796875, -1.3935546875, 0.6796875, 2.7529296875, 4.826171875, 6.8994140625, 8.97265625, 11.0458984375, 13.119140625, 15.1923828125, 17.265625, 19.3388671875, 21.412109375, 23.4853515625, 25.55859375, 27.6318359375, 29.705078125, 31.7783203125, 33.8515625, 35.9248046875, 37.998046875, 40.0712890625, 42.14453125, 44.2177734375, 46.291015625, 48.3642578125, 50.4375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 8.0, 14.0, 10.0, 20.0, 25.0, 27.0, 37.0, 55.0, 85.0, 128.0, 119.0, 139.0, 104.0, 59.0, 40.0, 33.0, 30.0, 12.0, 14.0, 7.0, 10.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-50.71875, -49.5869140625, -48.455078125, -47.3232421875, -46.19140625, -45.0595703125, -43.927734375, -42.7958984375, -41.6640625, -40.5322265625, -39.400390625, -38.2685546875, -37.13671875, -36.0048828125, -34.873046875, -33.7412109375, -32.609375, -31.4775390625, -30.345703125, -29.2138671875, -28.08203125, -26.9501953125, -25.818359375, -24.6865234375, -23.5546875, -22.4228515625, -21.291015625, -20.1591796875, -19.02734375, -17.8955078125, -16.763671875, -15.6318359375, -14.5, -13.3681640625, -12.236328125, -11.1044921875, -9.97265625, -8.8408203125, -7.708984375, -6.5771484375, -5.4453125, -4.3134765625, -3.181640625, -2.0498046875, -0.91796875, 0.2138671875, 1.345703125, 2.4775390625, 3.609375, 4.7412109375, 5.873046875, 7.0048828125, 8.13671875, 9.2685546875, 10.400390625, 11.5322265625, 12.6640625, 13.7958984375, 14.927734375, 16.0595703125, 17.19140625, 18.3232421875, 19.455078125, 20.5869140625, 21.71875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 17.0, 31.0, 70.0, 117.0, 223.0, 245.0, 134.0, 74.0, 40.0, 24.0, 14.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-513.3226318359375, -490.0787048339844, -466.83477783203125, -443.5908508300781, -420.346923828125, -397.1029968261719, -373.85906982421875, -350.6151428222656, -327.3712158203125, -304.1272888183594, -280.88336181640625, -257.6394348144531, -234.3955078125, -211.15158081054688, -187.90765380859375, -164.66372680664062, -141.4197998046875, -118.17587280273438, -94.93194580078125, -71.68801879882812, -48.444091796875, -25.200164794921875, -1.95623779296875, 21.287689208984375, 44.5316162109375, 67.77554321289062, 91.01947021484375, 114.26339721679688, 137.50732421875, 160.75125122070312, 183.99517822265625, 207.23910522460938, 230.48297119140625, 253.72689819335938, 276.9708251953125, 300.2147521972656, 323.45867919921875, 346.7026062011719, 369.946533203125, 393.1904602050781, 416.43438720703125, 439.6783142089844, 462.9222412109375, 486.1661682128906, 509.41009521484375, 532.654052734375, 555.89794921875, 579.141845703125, 602.3858032226562, 625.6297607421875, 648.8736572265625, 672.1175537109375, 695.3615112304688, 718.60546875, 741.849365234375, 765.09326171875, 788.3372192382812, 811.5811767578125, 834.8250732421875, 858.0689697265625, 881.3129272460938, 904.556884765625, 927.80078125, 951.044677734375, 974.2886352539062]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 8.0, 7.0, 8.0, 6.0, 6.0, 11.0, 17.0, 17.0, 18.0, 18.0, 27.0, 27.0, 36.0, 29.0, 27.0, 41.0, 33.0, 39.0, 37.0, 37.0, 34.0, 43.0, 49.0, 39.0, 29.0, 37.0, 37.0, 36.0, 38.0, 25.0, 35.0, 23.0, 16.0, 14.0, 22.0, 14.0, 12.0, 10.0, 7.0, 8.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-231.47592163085938, -224.01959228515625, -216.56326293945312, -209.10693359375, -201.65060424804688, -194.19427490234375, -186.7379608154297, -179.28163146972656, -171.82530212402344, -164.3689727783203, -156.9126434326172, -149.45631408691406, -142.0, -134.54367065429688, -127.08734130859375, -119.63101196289062, -112.1746826171875, -104.71835327148438, -97.26202392578125, -89.80570220947266, -82.34937286376953, -74.8930435180664, -67.43672180175781, -59.98039245605469, -52.52406311035156, -45.06773376464844, -37.61140823364258, -30.155080795288086, -22.698753356933594, -15.242424011230469, -7.786098480224609, -0.32977294921875, 7.1265411376953125, 14.582868576049805, 22.039196014404297, 29.49552345275879, 36.95185089111328, 44.408180236816406, 51.864505767822266, 59.320831298828125, 66.77716064453125, 74.23348999023438, 81.6898193359375, 89.1461410522461, 96.60247039794922, 104.05879974365234, 111.51512145996094, 118.97145080566406, 126.42778015136719, 133.8841094970703, 141.34043884277344, 148.79676818847656, 156.25308227539062, 163.70941162109375, 171.16574096679688, 178.6220703125, 186.07839965820312, 193.53472900390625, 200.99105834960938, 208.4473876953125, 215.90371704101562, 223.36004638671875, 230.8163604736328, 238.27268981933594, 245.72901916503906]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 3.0, 10.0, 12.0, 15.0, 30.0, 21.0, 25.0, 47.0, 59.0, 108.0, 122.0, 185.0, 256.0, 430.0, 586.0, 877.0, 1468.0, 2196.0, 3465.0, 5841.0, 10236.0, 20586.0, 49430.0, 230667.0, 3662883.0, 128489.0, 37181.0, 16639.0, 8755.0, 5070.0, 3067.0, 1899.0, 1202.0, 843.0, 520.0, 331.0, 233.0, 133.0, 114.0, 78.0, 49.0, 35.0, 26.0, 10.0, 18.0, 9.0, 7.0, 8.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-49.21875, -47.7861328125, -46.353515625, -44.9208984375, -43.48828125, -42.0556640625, -40.623046875, -39.1904296875, -37.7578125, -36.3251953125, -34.892578125, -33.4599609375, -32.02734375, -30.5947265625, -29.162109375, -27.7294921875, -26.296875, -24.8642578125, -23.431640625, -21.9990234375, -20.56640625, -19.1337890625, -17.701171875, -16.2685546875, -14.8359375, -13.4033203125, -11.970703125, -10.5380859375, -9.10546875, -7.6728515625, -6.240234375, -4.8076171875, -3.375, -1.9423828125, -0.509765625, 0.9228515625, 2.35546875, 3.7880859375, 5.220703125, 6.6533203125, 8.0859375, 9.5185546875, 10.951171875, 12.3837890625, 13.81640625, 15.2490234375, 16.681640625, 18.1142578125, 19.546875, 20.9794921875, 22.412109375, 23.8447265625, 25.27734375, 26.7099609375, 28.142578125, 29.5751953125, 31.0078125, 32.4404296875, 33.873046875, 35.3056640625, 36.73828125, 38.1708984375, 39.603515625, 41.0361328125, 42.46875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 8.0, 8.0, 14.0, 20.0, 21.0, 23.0, 26.0, 22.0, 25.0, 21.0, 40.0, 44.0, 46.0, 50.0, 51.0, 32.0, 46.0, 50.0, 37.0, 46.0, 51.0, 38.0, 49.0, 34.0, 26.0, 30.0, 26.0, 19.0, 19.0, 18.0, 9.0, 9.0, 8.0, 2.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8984375, -10.5516357421875, -10.204833984375, -9.8580322265625, -9.51123046875, -9.1644287109375, -8.817626953125, -8.4708251953125, -8.1240234375, -7.7772216796875, -7.430419921875, -7.0836181640625, -6.73681640625, -6.3900146484375, -6.043212890625, -5.6964111328125, -5.349609375, -5.0028076171875, -4.656005859375, -4.3092041015625, -3.96240234375, -3.6156005859375, -3.268798828125, -2.9219970703125, -2.5751953125, -2.2283935546875, -1.881591796875, -1.5347900390625, -1.18798828125, -0.8411865234375, -0.494384765625, -0.1475830078125, 0.19921875, 0.5460205078125, 0.892822265625, 1.2396240234375, 1.58642578125, 1.9332275390625, 2.280029296875, 2.6268310546875, 2.9736328125, 3.3204345703125, 3.667236328125, 4.0140380859375, 4.36083984375, 4.7076416015625, 5.054443359375, 5.4012451171875, 5.748046875, 6.0948486328125, 6.441650390625, 6.7884521484375, 7.13525390625, 7.4820556640625, 7.828857421875, 8.1756591796875, 8.5224609375, 8.8692626953125, 9.216064453125, 9.5628662109375, 9.90966796875, 10.2564697265625, 10.603271484375, 10.9500732421875, 11.296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 10.0, 9.0, 7.0, 16.0, 17.0, 29.0, 37.0, 60.0, 90.0, 158.0, 335.0, 762.0, 1921.0, 4984.0, 17837.0, 119493.0, 3890472.0, 130511.0, 18704.0, 5279.0, 1984.0, 785.0, 345.0, 155.0, 86.0, 48.0, 40.0, 30.0, 24.0, 15.0, 12.0, 9.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-99.0, -95.755859375, -92.51171875, -89.267578125, -86.0234375, -82.779296875, -79.53515625, -76.291015625, -73.046875, -69.802734375, -66.55859375, -63.314453125, -60.0703125, -56.826171875, -53.58203125, -50.337890625, -47.09375, -43.849609375, -40.60546875, -37.361328125, -34.1171875, -30.873046875, -27.62890625, -24.384765625, -21.140625, -17.896484375, -14.65234375, -11.408203125, -8.1640625, -4.919921875, -1.67578125, 1.568359375, 4.8125, 8.056640625, 11.30078125, 14.544921875, 17.7890625, 21.033203125, 24.27734375, 27.521484375, 30.765625, 34.009765625, 37.25390625, 40.498046875, 43.7421875, 46.986328125, 50.23046875, 53.474609375, 56.71875, 59.962890625, 63.20703125, 66.451171875, 69.6953125, 72.939453125, 76.18359375, 79.427734375, 82.671875, 85.916015625, 89.16015625, 92.404296875, 95.6484375, 98.892578125, 102.13671875, 105.380859375, 108.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 7.0, 3.0, 5.0, 5.0, 10.0, 20.0, 27.0, 52.0, 92.0, 234.0, 2323.0, 983.0, 151.0, 62.0, 38.0, 28.0, 13.0, 6.0, 8.0, 4.0, 3.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.203125, -28.416748046875, -26.63037109375, -24.843994140625, -23.0576171875, -21.271240234375, -19.48486328125, -17.698486328125, -15.912109375, -14.125732421875, -12.33935546875, -10.552978515625, -8.7666015625, -6.980224609375, -5.19384765625, -3.407470703125, -1.62109375, 0.165283203125, 1.95166015625, 3.738037109375, 5.5244140625, 7.310791015625, 9.09716796875, 10.883544921875, 12.669921875, 14.456298828125, 16.24267578125, 18.029052734375, 19.8154296875, 21.601806640625, 23.38818359375, 25.174560546875, 26.9609375, 28.747314453125, 30.53369140625, 32.320068359375, 34.1064453125, 35.892822265625, 37.67919921875, 39.465576171875, 41.251953125, 43.038330078125, 44.82470703125, 46.611083984375, 48.3974609375, 50.183837890625, 51.97021484375, 53.756591796875, 55.54296875, 57.329345703125, 59.11572265625, 60.902099609375, 62.6884765625, 64.474853515625, 66.26123046875, 68.047607421875, 69.833984375, 71.620361328125, 73.40673828125, 75.193115234375, 76.9794921875, 78.765869140625, 80.55224609375, 82.338623046875, 84.125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 20.0, 54.0, 133.0, 312.0, 284.0, 133.0, 40.0, 14.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-581.3467407226562, -568.4652709960938, -555.5838012695312, -542.7023315429688, -529.8209228515625, -516.939453125, -504.0579833984375, -491.176513671875, -478.2950439453125, -465.41357421875, -452.5321044921875, -439.6506652832031, -426.7691955566406, -413.8877258300781, -401.00628662109375, -388.12481689453125, -375.24334716796875, -362.36187744140625, -349.48040771484375, -336.5989685058594, -323.7174987792969, -310.8360290527344, -297.95458984375, -285.0731201171875, -272.191650390625, -259.3101806640625, -246.42872619628906, -233.54727172851562, -220.66580200195312, -207.78433227539062, -194.9028778076172, -182.02142333984375, -169.1399688720703, -156.25851440429688, -143.37704467773438, -130.49557495117188, -117.61412048339844, -104.73265838623047, -91.8511962890625, -78.96973419189453, -66.08827209472656, -53.206809997558594, -40.325347900390625, -27.443885803222656, -14.562423706054688, -1.6809616088867188, 11.20050048828125, 24.08196258544922, 36.96342468261719, 49.844886779785156, 62.726348876953125, 75.6078109741211, 88.48927307128906, 101.37073516845703, 114.252197265625, 127.13365936279297, 140.01512145996094, 152.89657592773438, 165.77804565429688, 178.65951538085938, 191.5409698486328, 204.42242431640625, 217.30389404296875, 230.18536376953125, 243.0668182373047]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 2.0, 4.0, 4.0, 7.0, 12.0, 18.0, 28.0, 24.0, 29.0, 45.0, 29.0, 37.0, 54.0, 52.0, 55.0, 56.0, 65.0, 55.0, 73.0, 44.0, 51.0, 46.0, 37.0, 38.0, 37.0, 32.0, 15.0, 17.0, 11.0, 9.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-146.84996032714844, -142.70748901367188, -138.56500244140625, -134.4225311279297, -130.28005981445312, -126.1375732421875, -121.99510192871094, -117.85262298583984, -113.71014404296875, -109.56766510009766, -105.42518615722656, -101.28271484375, -97.1402359008789, -92.99775695800781, -88.85528564453125, -84.71280670166016, -80.57032775878906, -76.42784881591797, -72.28536987304688, -68.14289855957031, -64.00041961669922, -59.857940673828125, -55.7154655456543, -51.57299041748047, -47.430511474609375, -43.28803253173828, -39.14555740356445, -35.003082275390625, -30.86060333251953, -26.71812629699707, -22.57564926147461, -18.43317222595215, -14.290679931640625, -10.148202896118164, -6.005725860595703, -1.8632488250732422, 2.2792282104492188, 6.42170524597168, 10.56418228149414, 14.706659317016602, 18.849136352539062, 22.991613388061523, 27.134090423583984, 31.276567459106445, 35.419044494628906, 39.5615234375, 43.70399856567383, 47.846473693847656, 51.98895263671875, 56.131431579589844, 60.27390670776367, 64.4163818359375, 68.5588607788086, 72.70133972167969, 76.84381103515625, 80.98628997802734, 85.12876892089844, 89.27124786376953, 93.41372680664062, 97.55619812011719, 101.69867706298828, 105.84115600585938, 109.98362731933594, 114.12610626220703, 118.26858520507812]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 19.0, 33.0, 33.0, 48.0, 85.0, 154.0, 234.0, 432.0, 764.0, 1299.0, 2159.0, 3815.0, 6650.0, 11892.0, 22667.0, 46114.0, 106566.0, 261355.0, 320128.0, 142507.0, 59677.0, 28450.0, 14583.0, 8182.0, 4372.0, 2575.0, 1488.0, 922.0, 493.0, 311.0, 197.0, 123.0, 92.0, 50.0, 30.0, 12.0, 11.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.84375, -46.203125, -44.5625, -42.921875, -41.28125, -39.640625, -38.0, -36.359375, -34.71875, -33.078125, -31.4375, -29.796875, -28.15625, -26.515625, -24.875, -23.234375, -21.59375, -19.953125, -18.3125, -16.671875, -15.03125, -13.390625, -11.75, -10.109375, -8.46875, -6.828125, -5.1875, -3.546875, -1.90625, -0.265625, 1.375, 3.015625, 4.65625, 6.296875, 7.9375, 9.578125, 11.21875, 12.859375, 14.5, 16.140625, 17.78125, 19.421875, 21.0625, 22.703125, 24.34375, 25.984375, 27.625, 29.265625, 30.90625, 32.546875, 34.1875, 35.828125, 37.46875, 39.109375, 40.75, 42.390625, 44.03125, 45.671875, 47.3125, 48.953125, 50.59375, 52.234375, 53.875, 55.515625, 57.15625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 0.0, 4.0, 5.0, 5.0, 5.0, 14.0, 10.0, 20.0, 15.0, 20.0, 25.0, 24.0, 31.0, 26.0, 33.0, 34.0, 33.0, 36.0, 56.0, 46.0, 38.0, 43.0, 40.0, 44.0, 34.0, 40.0, 34.0, 39.0, 36.0, 28.0, 29.0, 20.0, 20.0, 21.0, 22.0, 10.0, 10.0, 9.0, 6.0, 8.0, 10.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-12.4296875, -12.0699462890625, -11.710205078125, -11.3504638671875, -10.99072265625, -10.6309814453125, -10.271240234375, -9.9114990234375, -9.5517578125, -9.1920166015625, -8.832275390625, -8.4725341796875, -8.11279296875, -7.7530517578125, -7.393310546875, -7.0335693359375, -6.673828125, -6.3140869140625, -5.954345703125, -5.5946044921875, -5.23486328125, -4.8751220703125, -4.515380859375, -4.1556396484375, -3.7958984375, -3.4361572265625, -3.076416015625, -2.7166748046875, -2.35693359375, -1.9971923828125, -1.637451171875, -1.2777099609375, -0.91796875, -0.5582275390625, -0.198486328125, 0.1612548828125, 0.52099609375, 0.8807373046875, 1.240478515625, 1.6002197265625, 1.9599609375, 2.3197021484375, 2.679443359375, 3.0391845703125, 3.39892578125, 3.7586669921875, 4.118408203125, 4.4781494140625, 4.837890625, 5.1976318359375, 5.557373046875, 5.9171142578125, 6.27685546875, 6.6365966796875, 6.996337890625, 7.3560791015625, 7.7158203125, 8.0755615234375, 8.435302734375, 8.7950439453125, 9.15478515625, 9.5145263671875, 9.874267578125, 10.2340087890625, 10.59375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 9.0, 7.0, 8.0, 25.0, 31.0, 53.0, 92.0, 105.0, 187.0, 321.0, 655.0, 1647.0, 5492.0, 26317.0, 255127.0, 682616.0, 60946.0, 10313.0, 2521.0, 983.0, 432.0, 209.0, 127.0, 103.0, 56.0, 56.0, 24.0, 17.0, 17.0, 13.0, 6.0, 7.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-169.125, -163.875, -158.625, -153.375, -148.125, -142.875, -137.625, -132.375, -127.125, -121.875, -116.625, -111.375, -106.125, -100.875, -95.625, -90.375, -85.125, -79.875, -74.625, -69.375, -64.125, -58.875, -53.625, -48.375, -43.125, -37.875, -32.625, -27.375, -22.125, -16.875, -11.625, -6.375, -1.125, 4.125, 9.375, 14.625, 19.875, 25.125, 30.375, 35.625, 40.875, 46.125, 51.375, 56.625, 61.875, 67.125, 72.375, 77.625, 82.875, 88.125, 93.375, 98.625, 103.875, 109.125, 114.375, 119.625, 124.875, 130.125, 135.375, 140.625, 145.875, 151.125, 156.375, 161.625, 166.875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 3.0, 5.0, 4.0, 3.0, 8.0, 11.0, 7.0, 13.0, 21.0, 22.0, 24.0, 19.0, 29.0, 40.0, 39.0, 38.0, 59.0, 60.0, 58.0, 41.0, 38.0, 45.0, 49.0, 44.0, 44.0, 34.0, 29.0, 30.0, 24.0, 33.0, 18.0, 22.0, 15.0, 15.0, 13.0, 9.0, 9.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-72.1875, -69.7265625, -67.265625, -64.8046875, -62.34375, -59.8828125, -57.421875, -54.9609375, -52.5, -50.0390625, -47.578125, -45.1171875, -42.65625, -40.1953125, -37.734375, -35.2734375, -32.8125, -30.3515625, -27.890625, -25.4296875, -22.96875, -20.5078125, -18.046875, -15.5859375, -13.125, -10.6640625, -8.203125, -5.7421875, -3.28125, -0.8203125, 1.640625, 4.1015625, 6.5625, 9.0234375, 11.484375, 13.9453125, 16.40625, 18.8671875, 21.328125, 23.7890625, 26.25, 28.7109375, 31.171875, 33.6328125, 36.09375, 38.5546875, 41.015625, 43.4765625, 45.9375, 48.3984375, 50.859375, 53.3203125, 55.78125, 58.2421875, 60.703125, 63.1640625, 65.625, 68.0859375, 70.546875, 73.0078125, 75.46875, 77.9296875, 80.390625, 82.8515625, 85.3125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 6.0, 9.0, 11.0, 20.0, 33.0, 39.0, 60.0, 92.0, 124.0, 165.0, 304.0, 525.0, 790.0, 1482.0, 2573.0, 4784.0, 9681.0, 21106.0, 55584.0, 199174.0, 500525.0, 165172.0, 48426.0, 19017.0, 8614.0, 4349.0, 2409.0, 1397.0, 792.0, 457.0, 295.0, 201.0, 110.0, 70.0, 51.0, 37.0, 19.0, 15.0, 12.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.875, -36.80615234375, -35.7373046875, -34.66845703125, -33.599609375, -32.53076171875, -31.4619140625, -30.39306640625, -29.32421875, -28.25537109375, -27.1865234375, -26.11767578125, -25.048828125, -23.97998046875, -22.9111328125, -21.84228515625, -20.7734375, -19.70458984375, -18.6357421875, -17.56689453125, -16.498046875, -15.42919921875, -14.3603515625, -13.29150390625, -12.22265625, -11.15380859375, -10.0849609375, -9.01611328125, -7.947265625, -6.87841796875, -5.8095703125, -4.74072265625, -3.671875, -2.60302734375, -1.5341796875, -0.46533203125, 0.603515625, 1.67236328125, 2.7412109375, 3.81005859375, 4.87890625, 5.94775390625, 7.0166015625, 8.08544921875, 9.154296875, 10.22314453125, 11.2919921875, 12.36083984375, 13.4296875, 14.49853515625, 15.5673828125, 16.63623046875, 17.705078125, 18.77392578125, 19.8427734375, 20.91162109375, 21.98046875, 23.04931640625, 24.1181640625, 25.18701171875, 26.255859375, 27.32470703125, 28.3935546875, 29.46240234375, 30.53125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 8.0, 5.0, 8.0, 15.0, 17.0, 31.0, 30.0, 80.0, 71.0, 107.0, 131.0, 142.0, 101.0, 63.0, 67.0, 31.0, 20.0, 15.0, 13.0, 9.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00872802734375, -0.008462667465209961, -0.008197307586669922, -0.007931947708129883, -0.007666587829589844, -0.007401227951049805, -0.007135868072509766, -0.0068705081939697266, -0.0066051483154296875, -0.0063397884368896484, -0.006074428558349609, -0.00580906867980957, -0.005543708801269531, -0.005278348922729492, -0.005012989044189453, -0.004747629165649414, -0.004482269287109375, -0.004216909408569336, -0.003951549530029297, -0.003686189651489258, -0.0034208297729492188, -0.0031554698944091797, -0.0028901100158691406, -0.0026247501373291016, -0.0023593902587890625, -0.0020940303802490234, -0.0018286705017089844, -0.0015633106231689453, -0.0012979507446289062, -0.0010325908660888672, -0.0007672309875488281, -0.0005018711090087891, -0.00023651123046875, 2.8848648071289062e-05, 0.0002942085266113281, 0.0005595684051513672, 0.0008249282836914062, 0.0010902881622314453, 0.0013556480407714844, 0.0016210079193115234, 0.0018863677978515625, 0.0021517276763916016, 0.0024170875549316406, 0.0026824474334716797, 0.0029478073120117188, 0.003213167190551758, 0.003478527069091797, 0.003743886947631836, 0.004009246826171875, 0.004274606704711914, 0.004539966583251953, 0.004805326461791992, 0.005070686340332031, 0.00533604621887207, 0.005601406097412109, 0.0058667659759521484, 0.0061321258544921875, 0.0063974857330322266, 0.006662845611572266, 0.006928205490112305, 0.007193565368652344, 0.007458925247192383, 0.007724285125732422, 0.007989645004272461, 0.0082550048828125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 9.0, 20.0, 33.0, 37.0, 104.0, 167.0, 368.0, 1078.0, 5664.0, 132967.0, 880650.0, 23891.0, 2395.0, 639.0, 259.0, 124.0, 56.0, 38.0, 21.0, 12.0, 10.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.0, -80.5390625, -77.078125, -73.6171875, -70.15625, -66.6953125, -63.234375, -59.7734375, -56.3125, -52.8515625, -49.390625, -45.9296875, -42.46875, -39.0078125, -35.546875, -32.0859375, -28.625, -25.1640625, -21.703125, -18.2421875, -14.78125, -11.3203125, -7.859375, -4.3984375, -0.9375, 2.5234375, 5.984375, 9.4453125, 12.90625, 16.3671875, 19.828125, 23.2890625, 26.75, 30.2109375, 33.671875, 37.1328125, 40.59375, 44.0546875, 47.515625, 50.9765625, 54.4375, 57.8984375, 61.359375, 64.8203125, 68.28125, 71.7421875, 75.203125, 78.6640625, 82.125, 85.5859375, 89.046875, 92.5078125, 95.96875, 99.4296875, 102.890625, 106.3515625, 109.8125, 113.2734375, 116.734375, 120.1953125, 123.65625, 127.1171875, 130.578125, 134.0390625, 137.5]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 6.0, 16.0, 15.0, 17.0, 20.0, 19.0, 30.0, 34.0, 53.0, 43.0, 65.0, 82.0, 97.0, 121.0, 83.0, 60.0, 43.0, 47.0, 34.0, 15.0, 26.0, 14.0, 8.0, 10.0, 11.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.21875, -32.83837890625, -31.4580078125, -30.07763671875, -28.697265625, -27.31689453125, -25.9365234375, -24.55615234375, -23.17578125, -21.79541015625, -20.4150390625, -19.03466796875, -17.654296875, -16.27392578125, -14.8935546875, -13.51318359375, -12.1328125, -10.75244140625, -9.3720703125, -7.99169921875, -6.611328125, -5.23095703125, -3.8505859375, -2.47021484375, -1.08984375, 0.29052734375, 1.6708984375, 3.05126953125, 4.431640625, 5.81201171875, 7.1923828125, 8.57275390625, 9.953125, 11.33349609375, 12.7138671875, 14.09423828125, 15.474609375, 16.85498046875, 18.2353515625, 19.61572265625, 20.99609375, 22.37646484375, 23.7568359375, 25.13720703125, 26.517578125, 27.89794921875, 29.2783203125, 30.65869140625, 32.0390625, 33.41943359375, 34.7998046875, 36.18017578125, 37.560546875, 38.94091796875, 40.3212890625, 41.70166015625, 43.08203125, 44.46240234375, 45.8427734375, 47.22314453125, 48.603515625, 49.98388671875, 51.3642578125, 52.74462890625, 54.125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 13.0, 26.0, 80.0, 228.0, 359.0, 184.0, 69.0, 23.0, 14.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1172.158447265625, -1114.5994873046875, -1057.04052734375, -999.4815673828125, -941.922607421875, -884.3636474609375, -826.8046264648438, -769.2456665039062, -711.6867065429688, -654.1277465820312, -596.5687866210938, -539.009765625, -481.4508361816406, -423.8918762207031, -366.3328857421875, -308.77392578125, -251.2149658203125, -193.656005859375, -136.09703063964844, -78.53805541992188, -20.979095458984375, 36.579864501953125, 94.13885498046875, 151.69781494140625, 209.25677490234375, 266.81573486328125, 324.37469482421875, 381.9336853027344, 439.4926452636719, 497.0516052246094, 554.610595703125, 612.1695556640625, 669.728515625, 727.2874755859375, 784.846435546875, 842.4053955078125, 899.96435546875, 957.5233154296875, 1015.0823364257812, 1072.641357421875, 1130.2001953125, 1187.7591552734375, 1245.318115234375, 1302.8770751953125, 1360.43603515625, 1417.9949951171875, 1475.553955078125, 1533.113037109375, 1590.6719970703125, 1648.23095703125, 1705.7899169921875, 1763.348876953125, 1820.9078369140625, 1878.466796875, 1936.02587890625, 1993.584716796875, 2051.143798828125, 2108.702880859375, 2166.26171875, 2223.82080078125, 2281.379638671875, 2338.938720703125, 2396.49755859375, 2454.056640625, 2511.615478515625]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 9.0, 8.0, 11.0, 18.0, 17.0, 13.0, 25.0, 38.0, 23.0, 36.0, 39.0, 30.0, 55.0, 32.0, 35.0, 47.0, 44.0, 54.0, 45.0, 33.0, 39.0, 40.0, 40.0, 28.0, 28.0, 27.0, 20.0, 18.0, 20.0, 13.0, 19.0, 9.0, 11.0, 9.0, 9.0, 8.0, 9.0, 3.0, 5.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-430.1987609863281, -417.0608825683594, -403.9230041503906, -390.7851257324219, -377.6472473144531, -364.5093688964844, -351.37152099609375, -338.233642578125, -325.09576416015625, -311.9578857421875, -298.82000732421875, -285.68212890625, -272.54425048828125, -259.4063720703125, -246.2685089111328, -233.13063049316406, -219.99273681640625, -206.8548583984375, -193.71697998046875, -180.5791015625, -167.44122314453125, -154.3033447265625, -141.1654815673828, -128.02760314941406, -114.88972473144531, -101.75184631347656, -88.61396789550781, -75.4760971069336, -62.338218688964844, -49.200340270996094, -36.062469482421875, -22.924591064453125, -9.7867431640625, 3.351133346557617, 16.489009857177734, 29.62688446044922, 42.76476287841797, 55.90264129638672, 69.04051208496094, 82.17839050292969, 95.31626892089844, 108.45414733886719, 121.59202575683594, 134.72988891601562, 147.86776733398438, 161.00564575195312, 174.14352416992188, 187.28140258789062, 200.41928100585938, 213.55715942382812, 226.69503784179688, 239.83291625976562, 252.97079467773438, 266.1086730957031, 279.24652099609375, 292.3843994140625, 305.52227783203125, 318.66015625, 331.79803466796875, 344.9359130859375, 358.07379150390625, 371.211669921875, 384.34954833984375, 397.4874267578125, 410.62530517578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 4.0, 7.0, 9.0, 13.0, 20.0, 31.0, 34.0, 55.0, 102.0, 120.0, 238.0, 361.0, 573.0, 1026.0, 2276.0, 11941.0, 4156347.0, 15695.0, 2737.0, 1034.0, 582.0, 342.0, 246.0, 155.0, 112.0, 65.0, 51.0, 31.0, 21.0, 16.0, 9.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.75, -154.15625, -148.5625, -142.96875, -137.375, -131.78125, -126.1875, -120.59375, -115.0, -109.40625, -103.8125, -98.21875, -92.625, -87.03125, -81.4375, -75.84375, -70.25, -64.65625, -59.0625, -53.46875, -47.875, -42.28125, -36.6875, -31.09375, -25.5, -19.90625, -14.3125, -8.71875, -3.125, 2.46875, 8.0625, 13.65625, 19.25, 24.84375, 30.4375, 36.03125, 41.625, 47.21875, 52.8125, 58.40625, 64.0, 69.59375, 75.1875, 80.78125, 86.375, 91.96875, 97.5625, 103.15625, 108.75, 114.34375, 119.9375, 125.53125, 131.125, 136.71875, 142.3125, 147.90625, 153.5, 159.09375, 164.6875, 170.28125, 175.875, 181.46875, 187.0625, 192.65625, 198.25]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 14.0, 13.0, 24.0, 25.0, 34.0, 33.0, 40.0, 40.0, 50.0, 61.0, 65.0, 60.0, 79.0, 58.0, 53.0, 59.0, 45.0, 38.0, 34.0, 30.0, 26.0, 23.0, 21.0, 14.0, 13.0, 6.0, 11.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-28.59375, -27.85009765625, -27.1064453125, -26.36279296875, -25.619140625, -24.87548828125, -24.1318359375, -23.38818359375, -22.64453125, -21.90087890625, -21.1572265625, -20.41357421875, -19.669921875, -18.92626953125, -18.1826171875, -17.43896484375, -16.6953125, -15.95166015625, -15.2080078125, -14.46435546875, -13.720703125, -12.97705078125, -12.2333984375, -11.48974609375, -10.74609375, -10.00244140625, -9.2587890625, -8.51513671875, -7.771484375, -7.02783203125, -6.2841796875, -5.54052734375, -4.796875, -4.05322265625, -3.3095703125, -2.56591796875, -1.822265625, -1.07861328125, -0.3349609375, 0.40869140625, 1.15234375, 1.89599609375, 2.6396484375, 3.38330078125, 4.126953125, 4.87060546875, 5.6142578125, 6.35791015625, 7.1015625, 7.84521484375, 8.5888671875, 9.33251953125, 10.076171875, 10.81982421875, 11.5634765625, 12.30712890625, 13.05078125, 13.79443359375, 14.5380859375, 15.28173828125, 16.025390625, 16.76904296875, 17.5126953125, 18.25634765625, 19.0]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 12.0, 4.0, 14.0, 6.0, 18.0, 12.0, 14.0, 26.0, 37.0, 54.0, 78.0, 107.0, 148.0, 207.0, 330.0, 467.0, 657.0, 1090.0, 1920.0, 3633.0, 8917.0, 54353.0, 4084175.0, 24564.0, 6314.0, 2858.0, 1510.0, 876.0, 610.0, 357.0, 237.0, 170.0, 133.0, 87.0, 82.0, 55.0, 42.0, 33.0, 26.0, 16.0, 13.0, 9.0, 12.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-120.4375, -116.9296875, -113.421875, -109.9140625, -106.40625, -102.8984375, -99.390625, -95.8828125, -92.375, -88.8671875, -85.359375, -81.8515625, -78.34375, -74.8359375, -71.328125, -67.8203125, -64.3125, -60.8046875, -57.296875, -53.7890625, -50.28125, -46.7734375, -43.265625, -39.7578125, -36.25, -32.7421875, -29.234375, -25.7265625, -22.21875, -18.7109375, -15.203125, -11.6953125, -8.1875, -4.6796875, -1.171875, 2.3359375, 5.84375, 9.3515625, 12.859375, 16.3671875, 19.875, 23.3828125, 26.890625, 30.3984375, 33.90625, 37.4140625, 40.921875, 44.4296875, 47.9375, 51.4453125, 54.953125, 58.4609375, 61.96875, 65.4765625, 68.984375, 72.4921875, 76.0, 79.5078125, 83.015625, 86.5234375, 90.03125, 93.5390625, 97.046875, 100.5546875, 104.0625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 2.0, 4.0, 7.0, 10.0, 25.0, 85.0, 3786.0, 84.0, 34.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.296875, -23.342041015625, -22.38720703125, -21.432373046875, -20.4775390625, -19.522705078125, -18.56787109375, -17.613037109375, -16.658203125, -15.703369140625, -14.74853515625, -13.793701171875, -12.8388671875, -11.884033203125, -10.92919921875, -9.974365234375, -9.01953125, -8.064697265625, -7.10986328125, -6.155029296875, -5.2001953125, -4.245361328125, -3.29052734375, -2.335693359375, -1.380859375, -0.426025390625, 0.52880859375, 1.483642578125, 2.4384765625, 3.393310546875, 4.34814453125, 5.302978515625, 6.2578125, 7.212646484375, 8.16748046875, 9.122314453125, 10.0771484375, 11.031982421875, 11.98681640625, 12.941650390625, 13.896484375, 14.851318359375, 15.80615234375, 16.760986328125, 17.7158203125, 18.670654296875, 19.62548828125, 20.580322265625, 21.53515625, 22.489990234375, 23.44482421875, 24.399658203125, 25.3544921875, 26.309326171875, 27.26416015625, 28.218994140625, 29.173828125, 30.128662109375, 31.08349609375, 32.038330078125, 32.9931640625, 33.947998046875, 34.90283203125, 35.857666015625, 36.8125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 9.0, 26.0, 68.0, 172.0, 255.0, 245.0, 133.0, 55.0, 15.0, 15.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.73521423339844, -197.79803466796875, -192.86085510253906, -187.92367553710938, -182.9864959716797, -178.04931640625, -173.1121368408203, -168.17495727539062, -163.23777770996094, -158.30059814453125, -153.36341857910156, -148.42623901367188, -143.4890594482422, -138.5518798828125, -133.6147003173828, -128.67752075195312, -123.74034118652344, -118.80316162109375, -113.86598205566406, -108.92880249023438, -103.99162292480469, -99.054443359375, -94.11726379394531, -89.18008422851562, -84.24290466308594, -79.30572509765625, -74.36854553222656, -69.43136596679688, -64.49418640136719, -59.5570068359375, -54.61982727050781, -49.682647705078125, -44.745460510253906, -39.80828094482422, -34.87110137939453, -29.933921813964844, -24.996742248535156, -20.05956268310547, -15.122383117675781, -10.185203552246094, -5.248023986816406, -0.31084442138671875, 4.626335144042969, 9.563514709472656, 14.500694274902344, 19.43787384033203, 24.37505340576172, 29.312232971191406, 34.249412536621094, 39.18659210205078, 44.12377166748047, 49.060951232910156, 53.998130798339844, 58.93531036376953, 63.87248992919922, 68.8096694946289, 73.7468490600586, 78.68402862548828, 83.62120819091797, 88.55838775634766, 93.49556732177734, 98.43274688720703, 103.36992645263672, 108.3071060180664, 113.2442855834961]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 6.0, 9.0, 8.0, 10.0, 15.0, 11.0, 13.0, 17.0, 21.0, 20.0, 30.0, 26.0, 28.0, 44.0, 47.0, 45.0, 35.0, 40.0, 38.0, 44.0, 44.0, 40.0, 54.0, 33.0, 46.0, 32.0, 31.0, 32.0, 28.0, 29.0, 20.0, 25.0, 18.0, 17.0, 6.0, 13.0, 7.0, 8.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.0499267578125, -38.76712417602539, -37.48432159423828, -36.20151901245117, -34.91871643066406, -33.63591384887695, -32.353111267089844, -31.070310592651367, -29.787508010864258, -28.50470542907715, -27.22190284729004, -25.93910026550293, -24.656299591064453, -23.373497009277344, -22.090694427490234, -20.807891845703125, -19.525089263916016, -18.242286682128906, -16.959484100341797, -15.676682472229004, -14.393879890441895, -13.111077308654785, -11.828275680541992, -10.545473098754883, -9.262670516967773, -7.979867935180664, -6.697065830230713, -5.414263725280762, -4.131461143493652, -2.848658561706543, -1.5658564567565918, -0.2830543518066406, 0.9997482299804688, 2.282550573348999, 3.5653529167175293, 4.8481550216674805, 6.13095760345459, 7.413760185241699, 8.696561813354492, 9.979364395141602, 11.262166976928711, 12.54496955871582, 13.82777214050293, 15.110573768615723, 16.393375396728516, 17.676177978515625, 18.958980560302734, 20.241783142089844, 21.524585723876953, 22.807388305664062, 24.090190887451172, 25.37299346923828, 26.65579605102539, 27.9385986328125, 29.221399307250977, 30.504201889038086, 31.787004470825195, 33.06980514526367, 34.35260772705078, 35.63541030883789, 36.918212890625, 38.20101547241211, 39.48381805419922, 40.76662063598633, 42.04942321777344]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 4.0, 2.0, 10.0, 8.0, 11.0, 28.0, 30.0, 50.0, 66.0, 111.0, 154.0, 229.0, 380.0, 552.0, 914.0, 1365.0, 2300.0, 3799.0, 6612.0, 11843.0, 21858.0, 44121.0, 96647.0, 223091.0, 315239.0, 169838.0, 73654.0, 34517.0, 17384.0, 9723.0, 5445.0, 3147.0, 1972.0, 1163.0, 768.0, 479.0, 336.0, 241.0, 153.0, 94.0, 88.0, 45.0, 28.0, 19.0, 8.0, 8.0, 12.0, 8.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-60.84375, -58.9619140625, -57.080078125, -55.1982421875, -53.31640625, -51.4345703125, -49.552734375, -47.6708984375, -45.7890625, -43.9072265625, -42.025390625, -40.1435546875, -38.26171875, -36.3798828125, -34.498046875, -32.6162109375, -30.734375, -28.8525390625, -26.970703125, -25.0888671875, -23.20703125, -21.3251953125, -19.443359375, -17.5615234375, -15.6796875, -13.7978515625, -11.916015625, -10.0341796875, -8.15234375, -6.2705078125, -4.388671875, -2.5068359375, -0.625, 1.2568359375, 3.138671875, 5.0205078125, 6.90234375, 8.7841796875, 10.666015625, 12.5478515625, 14.4296875, 16.3115234375, 18.193359375, 20.0751953125, 21.95703125, 23.8388671875, 25.720703125, 27.6025390625, 29.484375, 31.3662109375, 33.248046875, 35.1298828125, 37.01171875, 38.8935546875, 40.775390625, 42.6572265625, 44.5390625, 46.4208984375, 48.302734375, 50.1845703125, 52.06640625, 53.9482421875, 55.830078125, 57.7119140625, 59.59375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 0.0, 3.0, 6.0, 9.0, 12.0, 15.0, 13.0, 22.0, 21.0, 20.0, 16.0, 34.0, 50.0, 48.0, 42.0, 33.0, 62.0, 42.0, 47.0, 58.0, 52.0, 43.0, 40.0, 38.0, 36.0, 43.0, 32.0, 26.0, 22.0, 19.0, 18.0, 16.0, 13.0, 5.0, 12.0, 3.0, 5.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-21.984375, -21.357177734375, -20.72998046875, -20.102783203125, -19.4755859375, -18.848388671875, -18.22119140625, -17.593994140625, -16.966796875, -16.339599609375, -15.71240234375, -15.085205078125, -14.4580078125, -13.830810546875, -13.20361328125, -12.576416015625, -11.94921875, -11.322021484375, -10.69482421875, -10.067626953125, -9.4404296875, -8.813232421875, -8.18603515625, -7.558837890625, -6.931640625, -6.304443359375, -5.67724609375, -5.050048828125, -4.4228515625, -3.795654296875, -3.16845703125, -2.541259765625, -1.9140625, -1.286865234375, -0.65966796875, -0.032470703125, 0.5947265625, 1.221923828125, 1.84912109375, 2.476318359375, 3.103515625, 3.730712890625, 4.35791015625, 4.985107421875, 5.6123046875, 6.239501953125, 6.86669921875, 7.493896484375, 8.12109375, 8.748291015625, 9.37548828125, 10.002685546875, 10.6298828125, 11.257080078125, 11.88427734375, 12.511474609375, 13.138671875, 13.765869140625, 14.39306640625, 15.020263671875, 15.6474609375, 16.274658203125, 16.90185546875, 17.529052734375, 18.15625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 7.0, 12.0, 6.0, 15.0, 20.0, 22.0, 30.0, 43.0, 71.0, 102.0, 151.0, 235.0, 362.0, 704.0, 2004.0, 7791.0, 54712.0, 739928.0, 216115.0, 19773.0, 3868.0, 1150.0, 553.0, 284.0, 166.0, 113.0, 90.0, 68.0, 57.0, 35.0, 15.0, 12.0, 6.0, 15.0, 7.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-212.375, -205.470703125, -198.56640625, -191.662109375, -184.7578125, -177.853515625, -170.94921875, -164.044921875, -157.140625, -150.236328125, -143.33203125, -136.427734375, -129.5234375, -122.619140625, -115.71484375, -108.810546875, -101.90625, -95.001953125, -88.09765625, -81.193359375, -74.2890625, -67.384765625, -60.48046875, -53.576171875, -46.671875, -39.767578125, -32.86328125, -25.958984375, -19.0546875, -12.150390625, -5.24609375, 1.658203125, 8.5625, 15.466796875, 22.37109375, 29.275390625, 36.1796875, 43.083984375, 49.98828125, 56.892578125, 63.796875, 70.701171875, 77.60546875, 84.509765625, 91.4140625, 98.318359375, 105.22265625, 112.126953125, 119.03125, 125.935546875, 132.83984375, 139.744140625, 146.6484375, 153.552734375, 160.45703125, 167.361328125, 174.265625, 181.169921875, 188.07421875, 194.978515625, 201.8828125, 208.787109375, 215.69140625, 222.595703125, 229.5]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 7.0, 4.0, 4.0, 14.0, 10.0, 12.0, 18.0, 25.0, 25.0, 36.0, 38.0, 41.0, 48.0, 39.0, 60.0, 40.0, 52.0, 64.0, 60.0, 43.0, 68.0, 51.0, 45.0, 23.0, 36.0, 31.0, 24.0, 19.0, 12.0, 16.0, 10.0, 7.0, 4.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.0625, -113.9775390625, -109.892578125, -105.8076171875, -101.72265625, -97.6376953125, -93.552734375, -89.4677734375, -85.3828125, -81.2978515625, -77.212890625, -73.1279296875, -69.04296875, -64.9580078125, -60.873046875, -56.7880859375, -52.703125, -48.6181640625, -44.533203125, -40.4482421875, -36.36328125, -32.2783203125, -28.193359375, -24.1083984375, -20.0234375, -15.9384765625, -11.853515625, -7.7685546875, -3.68359375, 0.4013671875, 4.486328125, 8.5712890625, 12.65625, 16.7412109375, 20.826171875, 24.9111328125, 28.99609375, 33.0810546875, 37.166015625, 41.2509765625, 45.3359375, 49.4208984375, 53.505859375, 57.5908203125, 61.67578125, 65.7607421875, 69.845703125, 73.9306640625, 78.015625, 82.1005859375, 86.185546875, 90.2705078125, 94.35546875, 98.4404296875, 102.525390625, 106.6103515625, 110.6953125, 114.7802734375, 118.865234375, 122.9501953125, 127.03515625, 131.1201171875, 135.205078125, 139.2900390625, 143.375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 11.0, 16.0, 20.0, 39.0, 67.0, 88.0, 211.0, 380.0, 858.0, 2285.0, 7691.0, 40483.0, 581872.0, 374615.0, 30109.0, 6369.0, 1961.0, 737.0, 338.0, 171.0, 87.0, 53.0, 37.0, 23.0, 10.0, 11.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.25, -72.6484375, -70.046875, -67.4453125, -64.84375, -62.2421875, -59.640625, -57.0390625, -54.4375, -51.8359375, -49.234375, -46.6328125, -44.03125, -41.4296875, -38.828125, -36.2265625, -33.625, -31.0234375, -28.421875, -25.8203125, -23.21875, -20.6171875, -18.015625, -15.4140625, -12.8125, -10.2109375, -7.609375, -5.0078125, -2.40625, 0.1953125, 2.796875, 5.3984375, 8.0, 10.6015625, 13.203125, 15.8046875, 18.40625, 21.0078125, 23.609375, 26.2109375, 28.8125, 31.4140625, 34.015625, 36.6171875, 39.21875, 41.8203125, 44.421875, 47.0234375, 49.625, 52.2265625, 54.828125, 57.4296875, 60.03125, 62.6328125, 65.234375, 67.8359375, 70.4375, 73.0390625, 75.640625, 78.2421875, 80.84375, 83.4453125, 86.046875, 88.6484375, 91.25]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 5.0, 8.0, 9.0, 5.0, 9.0, 19.0, 40.0, 71.0, 60.0, 73.0, 121.0, 144.0, 119.0, 101.0, 66.0, 34.0, 31.0, 26.0, 12.0, 7.0, 4.0, 3.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0123291015625, -0.012009859085083008, -0.011690616607666016, -0.011371374130249023, -0.011052131652832031, -0.010732889175415039, -0.010413646697998047, -0.010094404220581055, -0.009775161743164062, -0.00945591926574707, -0.009136676788330078, -0.008817434310913086, -0.008498191833496094, -0.008178949356079102, -0.00785970687866211, -0.007540464401245117, -0.007221221923828125, -0.006901979446411133, -0.006582736968994141, -0.0062634944915771484, -0.005944252014160156, -0.005625009536743164, -0.005305767059326172, -0.00498652458190918, -0.0046672821044921875, -0.004348039627075195, -0.004028797149658203, -0.003709554672241211, -0.0033903121948242188, -0.0030710697174072266, -0.0027518272399902344, -0.002432584762573242, -0.00211334228515625, -0.0017940998077392578, -0.0014748573303222656, -0.0011556148529052734, -0.0008363723754882812, -0.0005171298980712891, -0.00019788742065429688, 0.00012135505676269531, 0.0004405975341796875, 0.0007598400115966797, 0.0010790824890136719, 0.001398324966430664, 0.0017175674438476562, 0.0020368099212646484, 0.0023560523986816406, 0.002675294876098633, 0.002994537353515625, 0.003313779830932617, 0.0036330223083496094, 0.0039522647857666016, 0.004271507263183594, 0.004590749740600586, 0.004909992218017578, 0.00522923469543457, 0.0055484771728515625, 0.005867719650268555, 0.006186962127685547, 0.006506204605102539, 0.006825447082519531, 0.0071446895599365234, 0.007463932037353516, 0.007783174514770508, 0.0081024169921875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 10.0, 21.0, 19.0, 16.0, 36.0, 56.0, 62.0, 132.0, 201.0, 341.0, 745.0, 2249.0, 8807.0, 65550.0, 815242.0, 136015.0, 13952.0, 3085.0, 962.0, 444.0, 217.0, 114.0, 80.0, 46.0, 48.0, 21.0, 12.0, 10.0, 12.0, 12.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.3125, -71.623046875, -68.93359375, -66.244140625, -63.5546875, -60.865234375, -58.17578125, -55.486328125, -52.796875, -50.107421875, -47.41796875, -44.728515625, -42.0390625, -39.349609375, -36.66015625, -33.970703125, -31.28125, -28.591796875, -25.90234375, -23.212890625, -20.5234375, -17.833984375, -15.14453125, -12.455078125, -9.765625, -7.076171875, -4.38671875, -1.697265625, 0.9921875, 3.681640625, 6.37109375, 9.060546875, 11.75, 14.439453125, 17.12890625, 19.818359375, 22.5078125, 25.197265625, 27.88671875, 30.576171875, 33.265625, 35.955078125, 38.64453125, 41.333984375, 44.0234375, 46.712890625, 49.40234375, 52.091796875, 54.78125, 57.470703125, 60.16015625, 62.849609375, 65.5390625, 68.228515625, 70.91796875, 73.607421875, 76.296875, 78.986328125, 81.67578125, 84.365234375, 87.0546875, 89.744140625, 92.43359375, 95.123046875, 97.8125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 12.0, 15.0, 9.0, 15.0, 18.0, 26.0, 28.0, 48.0, 61.0, 77.0, 88.0, 98.0, 91.0, 97.0, 76.0, 47.0, 41.0, 28.0, 21.0, 17.0, 14.0, 11.0, 10.0, 6.0, 10.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.4375, -43.6865234375, -41.935546875, -40.1845703125, -38.43359375, -36.6826171875, -34.931640625, -33.1806640625, -31.4296875, -29.6787109375, -27.927734375, -26.1767578125, -24.42578125, -22.6748046875, -20.923828125, -19.1728515625, -17.421875, -15.6708984375, -13.919921875, -12.1689453125, -10.41796875, -8.6669921875, -6.916015625, -5.1650390625, -3.4140625, -1.6630859375, 0.087890625, 1.8388671875, 3.58984375, 5.3408203125, 7.091796875, 8.8427734375, 10.59375, 12.3447265625, 14.095703125, 15.8466796875, 17.59765625, 19.3486328125, 21.099609375, 22.8505859375, 24.6015625, 26.3525390625, 28.103515625, 29.8544921875, 31.60546875, 33.3564453125, 35.107421875, 36.8583984375, 38.609375, 40.3603515625, 42.111328125, 43.8623046875, 45.61328125, 47.3642578125, 49.115234375, 50.8662109375, 52.6171875, 54.3681640625, 56.119140625, 57.8701171875, 59.62109375, 61.3720703125, 63.123046875, 64.8740234375, 66.625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 10.0, 22.0, 56.0, 109.0, 197.0, 268.0, 168.0, 87.0, 35.0, 24.0, 13.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1042.6959228515625, -997.990234375, -953.2844848632812, -908.5787353515625, -863.873046875, -819.1673583984375, -774.4616088867188, -729.755859375, -685.0501708984375, -640.344482421875, -595.6387329101562, -550.9329833984375, -506.227294921875, -461.5215759277344, -416.81585693359375, -372.1101379394531, -327.4044189453125, -282.6986999511719, -237.99298095703125, -193.28726196289062, -148.58154296875, -103.87582397460938, -59.17010498046875, -14.464385986328125, 30.2413330078125, 74.94705200195312, 119.65277099609375, 164.35848999023438, 209.064208984375, 253.76992797851562, 298.47564697265625, 343.1813659667969, 387.8870849609375, 432.5928039550781, 477.29852294921875, 522.0042724609375, 566.7099609375, 611.4156494140625, 656.1213989257812, 700.8271484375, 745.5328369140625, 790.238525390625, 834.9442749023438, 879.6500244140625, 924.355712890625, 969.0614013671875, 1013.7671508789062, 1058.472900390625, 1103.1785888671875, 1147.88427734375, 1192.590087890625, 1237.2957763671875, 1282.00146484375, 1326.7071533203125, 1371.412841796875, 1416.11865234375, 1460.8243408203125, 1505.530029296875, 1550.23583984375, 1594.9415283203125, 1639.647216796875, 1684.3529052734375, 1729.05859375, 1773.764404296875, 1818.4700927734375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 7.0, 9.0, 9.0, 15.0, 14.0, 10.0, 15.0, 19.0, 25.0, 20.0, 22.0, 23.0, 28.0, 36.0, 44.0, 25.0, 37.0, 23.0, 37.0, 28.0, 57.0, 50.0, 42.0, 39.0, 37.0, 30.0, 36.0, 51.0, 26.0, 28.0, 26.0, 19.0, 15.0, 20.0, 11.0, 12.0, 6.0, 11.0, 9.0, 8.0, 3.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-468.611328125, -454.606689453125, -440.60205078125, -426.597412109375, -412.5927734375, -398.588134765625, -384.58349609375, -370.578857421875, -356.57421875, -342.569580078125, -328.56494140625, -314.560302734375, -300.5556640625, -286.551025390625, -272.54638671875, -258.541748046875, -244.53712463378906, -230.53248596191406, -216.52784729003906, -202.52320861816406, -188.51856994628906, -174.51394653320312, -160.50930786132812, -146.50466918945312, -132.50003051757812, -118.49539184570312, -104.49075317382812, -90.48611450195312, -76.48147583007812, -62.476844787597656, -48.472206115722656, -34.467567443847656, -20.462921142578125, -6.458283424377441, 7.546354293823242, 21.55099105834961, 35.55562973022461, 49.560264587402344, 63.564903259277344, 77.56954193115234, 91.57418060302734, 105.57881927490234, 119.58345794677734, 133.5880889892578, 147.5927276611328, 161.5973663330078, 175.6020050048828, 189.6066436767578, 203.6112823486328, 217.6159210205078, 231.6205596923828, 245.6251983642578, 259.62982177734375, 273.63446044921875, 287.63909912109375, 301.64373779296875, 315.64837646484375, 329.65301513671875, 343.65765380859375, 357.66229248046875, 371.66693115234375, 385.67156982421875, 399.67620849609375, 413.68084716796875, 427.68548583984375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 8.0, 19.0, 24.0, 28.0, 65.0, 91.0, 167.0, 333.0, 687.0, 1587.0, 4896.0, 4036977.0, 142169.0, 4365.0, 1426.0, 609.0, 310.0, 187.0, 110.0, 59.0, 36.0, 29.0, 23.0, 15.0, 8.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.25, -169.94921875, -163.6484375, -157.34765625, -151.046875, -144.74609375, -138.4453125, -132.14453125, -125.84375, -119.54296875, -113.2421875, -106.94140625, -100.640625, -94.33984375, -88.0390625, -81.73828125, -75.4375, -69.13671875, -62.8359375, -56.53515625, -50.234375, -43.93359375, -37.6328125, -31.33203125, -25.03125, -18.73046875, -12.4296875, -6.12890625, 0.171875, 6.47265625, 12.7734375, 19.07421875, 25.375, 31.67578125, 37.9765625, 44.27734375, 50.578125, 56.87890625, 63.1796875, 69.48046875, 75.78125, 82.08203125, 88.3828125, 94.68359375, 100.984375, 107.28515625, 113.5859375, 119.88671875, 126.1875, 132.48828125, 138.7890625, 145.08984375, 151.390625, 157.69140625, 163.9921875, 170.29296875, 176.59375, 182.89453125, 189.1953125, 195.49609375, 201.796875, 208.09765625, 214.3984375, 220.69921875, 227.0]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 14.0, 12.0, 13.0, 16.0, 22.0, 23.0, 24.0, 31.0, 26.0, 50.0, 40.0, 55.0, 54.0, 37.0, 57.0, 56.0, 62.0, 46.0, 53.0, 43.0, 38.0, 34.0, 28.0, 28.0, 23.0, 21.0, 11.0, 13.0, 11.0, 15.0, 9.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-22.296875, -21.580322265625, -20.86376953125, -20.147216796875, -19.4306640625, -18.714111328125, -17.99755859375, -17.281005859375, -16.564453125, -15.847900390625, -15.13134765625, -14.414794921875, -13.6982421875, -12.981689453125, -12.26513671875, -11.548583984375, -10.83203125, -10.115478515625, -9.39892578125, -8.682373046875, -7.9658203125, -7.249267578125, -6.53271484375, -5.816162109375, -5.099609375, -4.383056640625, -3.66650390625, -2.949951171875, -2.2333984375, -1.516845703125, -0.80029296875, -0.083740234375, 0.6328125, 1.349365234375, 2.06591796875, 2.782470703125, 3.4990234375, 4.215576171875, 4.93212890625, 5.648681640625, 6.365234375, 7.081787109375, 7.79833984375, 8.514892578125, 9.2314453125, 9.947998046875, 10.66455078125, 11.381103515625, 12.09765625, 12.814208984375, 13.53076171875, 14.247314453125, 14.9638671875, 15.680419921875, 16.39697265625, 17.113525390625, 17.830078125, 18.546630859375, 19.26318359375, 19.979736328125, 20.6962890625, 21.412841796875, 22.12939453125, 22.845947265625, 23.5625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 6.0, 10.0, 9.0, 11.0, 13.0, 18.0, 26.0, 31.0, 44.0, 53.0, 67.0, 78.0, 118.0, 154.0, 203.0, 239.0, 365.0, 478.0, 749.0, 1203.0, 2351.0, 6977.0, 48624.0, 4094778.0, 26877.0, 5216.0, 2022.0, 1122.0, 683.0, 415.0, 353.0, 229.0, 194.0, 121.0, 98.0, 84.0, 63.0, 55.0, 42.0, 25.0, 12.0, 23.0, 13.0, 13.0, 10.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-117.6875, -113.9375, -110.1875, -106.4375, -102.6875, -98.9375, -95.1875, -91.4375, -87.6875, -83.9375, -80.1875, -76.4375, -72.6875, -68.9375, -65.1875, -61.4375, -57.6875, -53.9375, -50.1875, -46.4375, -42.6875, -38.9375, -35.1875, -31.4375, -27.6875, -23.9375, -20.1875, -16.4375, -12.6875, -8.9375, -5.1875, -1.4375, 2.3125, 6.0625, 9.8125, 13.5625, 17.3125, 21.0625, 24.8125, 28.5625, 32.3125, 36.0625, 39.8125, 43.5625, 47.3125, 51.0625, 54.8125, 58.5625, 62.3125, 66.0625, 69.8125, 73.5625, 77.3125, 81.0625, 84.8125, 88.5625, 92.3125, 96.0625, 99.8125, 103.5625, 107.3125, 111.0625, 114.8125, 118.5625, 122.3125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 6.0, 10.0, 21.0, 32.0, 140.0, 3739.0, 80.0, 20.0, 12.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.65625, -39.470703125, -38.28515625, -37.099609375, -35.9140625, -34.728515625, -33.54296875, -32.357421875, -31.171875, -29.986328125, -28.80078125, -27.615234375, -26.4296875, -25.244140625, -24.05859375, -22.873046875, -21.6875, -20.501953125, -19.31640625, -18.130859375, -16.9453125, -15.759765625, -14.57421875, -13.388671875, -12.203125, -11.017578125, -9.83203125, -8.646484375, -7.4609375, -6.275390625, -5.08984375, -3.904296875, -2.71875, -1.533203125, -0.34765625, 0.837890625, 2.0234375, 3.208984375, 4.39453125, 5.580078125, 6.765625, 7.951171875, 9.13671875, 10.322265625, 11.5078125, 12.693359375, 13.87890625, 15.064453125, 16.25, 17.435546875, 18.62109375, 19.806640625, 20.9921875, 22.177734375, 23.36328125, 24.548828125, 25.734375, 26.919921875, 28.10546875, 29.291015625, 30.4765625, 31.662109375, 32.84765625, 34.033203125, 35.21875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 8.0, 8.0, 21.0, 31.0, 45.0, 61.0, 101.0, 116.0, 164.0, 133.0, 111.0, 75.0, 57.0, 24.0, 21.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-145.93319702148438, -142.6768341064453, -139.4204559326172, -136.16409301757812, -132.90771484375, -129.65135192871094, -126.39498901367188, -123.13861846923828, -119.88224792480469, -116.6258773803711, -113.3695068359375, -110.11314392089844, -106.85677337646484, -103.60040283203125, -100.34403991699219, -97.0876693725586, -93.831298828125, -90.5749282836914, -87.31855773925781, -84.06219482421875, -80.80582427978516, -77.54945373535156, -74.2930908203125, -71.0367202758789, -67.78034973144531, -64.52397918701172, -61.26761245727539, -58.01124572753906, -54.75487518310547, -51.498504638671875, -48.24213790893555, -44.98577117919922, -41.729393005371094, -38.4730224609375, -35.21665573120117, -31.96028709411621, -28.70391845703125, -25.44754981994629, -22.191181182861328, -18.934812545776367, -15.678443908691406, -12.422075271606445, -9.165706634521484, -5.909337997436523, -2.6529693603515625, 0.6033992767333984, 3.8597679138183594, 7.11613655090332, 10.372505187988281, 13.628873825073242, 16.885242462158203, 20.141611099243164, 23.397979736328125, 26.654348373413086, 29.910717010498047, 33.167083740234375, 36.42345428466797, 39.67982482910156, 42.93619155883789, 46.19255828857422, 49.44892883300781, 52.705299377441406, 55.961666107177734, 59.21803283691406, 62.474403381347656]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 2.0, 10.0, 8.0, 9.0, 16.0, 21.0, 12.0, 18.0, 19.0, 23.0, 20.0, 36.0, 36.0, 44.0, 39.0, 57.0, 50.0, 49.0, 29.0, 58.0, 41.0, 56.0, 49.0, 29.0, 34.0, 38.0, 29.0, 33.0, 25.0, 24.0, 19.0, 14.0, 15.0, 6.0, 6.0, 3.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.32720947265625, -50.669002532958984, -49.01079559326172, -47.35259246826172, -45.69438552856445, -44.03617858886719, -42.37797164916992, -40.719764709472656, -39.061561584472656, -37.40335464477539, -35.745147705078125, -34.086944580078125, -32.42873764038086, -30.770530700683594, -29.112323760986328, -27.454116821289062, -25.795909881591797, -24.13770294189453, -22.4794979095459, -20.821290969848633, -19.1630859375, -17.504878997802734, -15.846672058105469, -14.18846607208252, -12.53026008605957, -10.872054100036621, -9.213848114013672, -7.555641174316406, -5.897435188293457, -4.239229202270508, -2.581022262573242, -0.922816276550293, 0.7353897094726562, 2.3935959339141846, 4.051802158355713, 5.71000862121582, 7.3682146072387695, 9.026420593261719, 10.684627532958984, 12.342833518981934, 14.001039505004883, 15.659245491027832, 17.31745147705078, 18.975658416748047, 20.633865356445312, 22.292070388793945, 23.95027732849121, 25.608482360839844, 27.26668930053711, 28.924896240234375, 30.583101272583008, 32.241310119628906, 33.899513244628906, 35.55772018432617, 37.21592712402344, 38.8741340637207, 40.53234100341797, 42.190547943115234, 43.8487548828125, 45.5069580078125, 47.165164947509766, 48.82337188720703, 50.4815788269043, 52.13978576660156, 53.79798889160156]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 8.0, 20.0, 21.0, 31.0, 43.0, 56.0, 76.0, 146.0, 197.0, 333.0, 538.0, 854.0, 1633.0, 2928.0, 5389.0, 10765.0, 22444.0, 54076.0, 156233.0, 425405.0, 234820.0, 74171.0, 29782.0, 13557.0, 6627.0, 3454.0, 1845.0, 1129.0, 725.0, 420.0, 263.0, 171.0, 131.0, 72.0, 54.0, 35.0, 17.0, 24.0, 20.0, 9.0, 10.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-80.1875, -77.8056640625, -75.423828125, -73.0419921875, -70.66015625, -68.2783203125, -65.896484375, -63.5146484375, -61.1328125, -58.7509765625, -56.369140625, -53.9873046875, -51.60546875, -49.2236328125, -46.841796875, -44.4599609375, -42.078125, -39.6962890625, -37.314453125, -34.9326171875, -32.55078125, -30.1689453125, -27.787109375, -25.4052734375, -23.0234375, -20.6416015625, -18.259765625, -15.8779296875, -13.49609375, -11.1142578125, -8.732421875, -6.3505859375, -3.96875, -1.5869140625, 0.794921875, 3.1767578125, 5.55859375, 7.9404296875, 10.322265625, 12.7041015625, 15.0859375, 17.4677734375, 19.849609375, 22.2314453125, 24.61328125, 26.9951171875, 29.376953125, 31.7587890625, 34.140625, 36.5224609375, 38.904296875, 41.2861328125, 43.66796875, 46.0498046875, 48.431640625, 50.8134765625, 53.1953125, 55.5771484375, 57.958984375, 60.3408203125, 62.72265625, 65.1044921875, 67.486328125, 69.8681640625, 72.25]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 8.0, 9.0, 10.0, 11.0, 12.0, 18.0, 29.0, 19.0, 32.0, 32.0, 38.0, 47.0, 39.0, 44.0, 49.0, 73.0, 56.0, 45.0, 60.0, 39.0, 52.0, 46.0, 34.0, 32.0, 22.0, 24.0, 25.0, 16.0, 19.0, 11.0, 11.0, 11.0, 8.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.421875, -22.66064453125, -21.8994140625, -21.13818359375, -20.376953125, -19.61572265625, -18.8544921875, -18.09326171875, -17.33203125, -16.57080078125, -15.8095703125, -15.04833984375, -14.287109375, -13.52587890625, -12.7646484375, -12.00341796875, -11.2421875, -10.48095703125, -9.7197265625, -8.95849609375, -8.197265625, -7.43603515625, -6.6748046875, -5.91357421875, -5.15234375, -4.39111328125, -3.6298828125, -2.86865234375, -2.107421875, -1.34619140625, -0.5849609375, 0.17626953125, 0.9375, 1.69873046875, 2.4599609375, 3.22119140625, 3.982421875, 4.74365234375, 5.5048828125, 6.26611328125, 7.02734375, 7.78857421875, 8.5498046875, 9.31103515625, 10.072265625, 10.83349609375, 11.5947265625, 12.35595703125, 13.1171875, 13.87841796875, 14.6396484375, 15.40087890625, 16.162109375, 16.92333984375, 17.6845703125, 18.44580078125, 19.20703125, 19.96826171875, 20.7294921875, 21.49072265625, 22.251953125, 23.01318359375, 23.7744140625, 24.53564453125, 25.296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 7.0, 21.0, 20.0, 30.0, 35.0, 62.0, 98.0, 129.0, 247.0, 433.0, 813.0, 2352.0, 10912.0, 190262.0, 806223.0, 30144.0, 4153.0, 1215.0, 566.0, 304.0, 166.0, 112.0, 73.0, 56.0, 29.0, 21.0, 16.0, 12.0, 8.0, 2.0, 6.0, 6.0, 4.0, 1.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-309.25, -300.46875, -291.6875, -282.90625, -274.125, -265.34375, -256.5625, -247.78125, -239.0, -230.21875, -221.4375, -212.65625, -203.875, -195.09375, -186.3125, -177.53125, -168.75, -159.96875, -151.1875, -142.40625, -133.625, -124.84375, -116.0625, -107.28125, -98.5, -89.71875, -80.9375, -72.15625, -63.375, -54.59375, -45.8125, -37.03125, -28.25, -19.46875, -10.6875, -1.90625, 6.875, 15.65625, 24.4375, 33.21875, 42.0, 50.78125, 59.5625, 68.34375, 77.125, 85.90625, 94.6875, 103.46875, 112.25, 121.03125, 129.8125, 138.59375, 147.375, 156.15625, 164.9375, 173.71875, 182.5, 191.28125, 200.0625, 208.84375, 217.625, 226.40625, 235.1875, 243.96875, 252.75]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 7.0, 5.0, 9.0, 12.0, 16.0, 17.0, 23.0, 17.0, 18.0, 25.0, 26.0, 33.0, 30.0, 39.0, 41.0, 41.0, 41.0, 44.0, 41.0, 49.0, 35.0, 50.0, 37.0, 41.0, 34.0, 41.0, 32.0, 27.0, 31.0, 24.0, 10.0, 18.0, 12.0, 16.0, 17.0, 8.0, 5.0, 9.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-104.4375, -100.9912109375, -97.544921875, -94.0986328125, -90.65234375, -87.2060546875, -83.759765625, -80.3134765625, -76.8671875, -73.4208984375, -69.974609375, -66.5283203125, -63.08203125, -59.6357421875, -56.189453125, -52.7431640625, -49.296875, -45.8505859375, -42.404296875, -38.9580078125, -35.51171875, -32.0654296875, -28.619140625, -25.1728515625, -21.7265625, -18.2802734375, -14.833984375, -11.3876953125, -7.94140625, -4.4951171875, -1.048828125, 2.3974609375, 5.84375, 9.2900390625, 12.736328125, 16.1826171875, 19.62890625, 23.0751953125, 26.521484375, 29.9677734375, 33.4140625, 36.8603515625, 40.306640625, 43.7529296875, 47.19921875, 50.6455078125, 54.091796875, 57.5380859375, 60.984375, 64.4306640625, 67.876953125, 71.3232421875, 74.76953125, 78.2158203125, 81.662109375, 85.1083984375, 88.5546875, 92.0009765625, 95.447265625, 98.8935546875, 102.33984375, 105.7861328125, 109.232421875, 112.6787109375, 116.125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 0.0, 4.0, 6.0, 11.0, 11.0, 14.0, 23.0, 35.0, 53.0, 63.0, 112.0, 186.0, 304.0, 567.0, 1252.0, 2879.0, 8350.0, 35631.0, 431036.0, 514378.0, 39141.0, 8778.0, 3011.0, 1209.0, 593.0, 317.0, 229.0, 116.0, 72.0, 53.0, 38.0, 19.0, 13.0, 8.0, 8.0, 5.0, 8.0, 7.0, 1.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-103.375, -100.3369140625, -97.298828125, -94.2607421875, -91.22265625, -88.1845703125, -85.146484375, -82.1083984375, -79.0703125, -76.0322265625, -72.994140625, -69.9560546875, -66.91796875, -63.8798828125, -60.841796875, -57.8037109375, -54.765625, -51.7275390625, -48.689453125, -45.6513671875, -42.61328125, -39.5751953125, -36.537109375, -33.4990234375, -30.4609375, -27.4228515625, -24.384765625, -21.3466796875, -18.30859375, -15.2705078125, -12.232421875, -9.1943359375, -6.15625, -3.1181640625, -0.080078125, 2.9580078125, 5.99609375, 9.0341796875, 12.072265625, 15.1103515625, 18.1484375, 21.1865234375, 24.224609375, 27.2626953125, 30.30078125, 33.3388671875, 36.376953125, 39.4150390625, 42.453125, 45.4912109375, 48.529296875, 51.5673828125, 54.60546875, 57.6435546875, 60.681640625, 63.7197265625, 66.7578125, 69.7958984375, 72.833984375, 75.8720703125, 78.91015625, 81.9482421875, 84.986328125, 88.0244140625, 91.0625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 2.0, 8.0, 8.0, 9.0, 21.0, 18.0, 28.0, 58.0, 81.0, 135.0, 160.0, 144.0, 108.0, 70.0, 45.0, 28.0, 22.0, 15.0, 8.0, 5.0, 9.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01465606689453125, -0.014194130897521973, -0.013732194900512695, -0.013270258903503418, -0.01280832290649414, -0.012346386909484863, -0.011884450912475586, -0.011422514915466309, -0.010960578918457031, -0.010498642921447754, -0.010036706924438477, -0.0095747709274292, -0.009112834930419922, -0.008650898933410645, -0.008188962936401367, -0.00772702693939209, -0.0072650909423828125, -0.006803154945373535, -0.006341218948364258, -0.0058792829513549805, -0.005417346954345703, -0.004955410957336426, -0.0044934749603271484, -0.004031538963317871, -0.0035696029663085938, -0.0031076669692993164, -0.002645730972290039, -0.0021837949752807617, -0.0017218589782714844, -0.001259922981262207, -0.0007979869842529297, -0.00033605098724365234, 0.000125885009765625, 0.0005878210067749023, 0.0010497570037841797, 0.001511693000793457, 0.0019736289978027344, 0.0024355649948120117, 0.002897500991821289, 0.0033594369888305664, 0.0038213729858398438, 0.004283308982849121, 0.0047452449798583984, 0.005207180976867676, 0.005669116973876953, 0.0061310529708862305, 0.006592988967895508, 0.007054924964904785, 0.0075168609619140625, 0.00797879695892334, 0.008440732955932617, 0.008902668952941895, 0.009364604949951172, 0.00982654094696045, 0.010288476943969727, 0.010750412940979004, 0.011212348937988281, 0.011674284934997559, 0.012136220932006836, 0.012598156929016113, 0.01306009292602539, 0.013522028923034668, 0.013983964920043945, 0.014445900917053223, 0.0149078369140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 7.0, 10.0, 27.0, 26.0, 51.0, 86.0, 188.0, 353.0, 863.0, 2445.0, 11430.0, 218698.0, 786906.0, 21716.0, 3689.0, 1151.0, 422.0, 198.0, 104.0, 57.0, 38.0, 21.0, 22.0, 8.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-129.0, -123.87109375, -118.7421875, -113.61328125, -108.484375, -103.35546875, -98.2265625, -93.09765625, -87.96875, -82.83984375, -77.7109375, -72.58203125, -67.453125, -62.32421875, -57.1953125, -52.06640625, -46.9375, -41.80859375, -36.6796875, -31.55078125, -26.421875, -21.29296875, -16.1640625, -11.03515625, -5.90625, -0.77734375, 4.3515625, 9.48046875, 14.609375, 19.73828125, 24.8671875, 29.99609375, 35.125, 40.25390625, 45.3828125, 50.51171875, 55.640625, 60.76953125, 65.8984375, 71.02734375, 76.15625, 81.28515625, 86.4140625, 91.54296875, 96.671875, 101.80078125, 106.9296875, 112.05859375, 117.1875, 122.31640625, 127.4453125, 132.57421875, 137.703125, 142.83203125, 147.9609375, 153.08984375, 158.21875, 163.34765625, 168.4765625, 173.60546875, 178.734375, 183.86328125, 188.9921875, 194.12109375, 199.25]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 11.0, 14.0, 16.0, 23.0, 44.0, 60.0, 90.0, 140.0, 130.0, 130.0, 102.0, 76.0, 48.0, 38.0, 26.0, 12.0, 9.0, 6.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.0625, -94.76171875, -91.4609375, -88.16015625, -84.859375, -81.55859375, -78.2578125, -74.95703125, -71.65625, -68.35546875, -65.0546875, -61.75390625, -58.453125, -55.15234375, -51.8515625, -48.55078125, -45.25, -41.94921875, -38.6484375, -35.34765625, -32.046875, -28.74609375, -25.4453125, -22.14453125, -18.84375, -15.54296875, -12.2421875, -8.94140625, -5.640625, -2.33984375, 0.9609375, 4.26171875, 7.5625, 10.86328125, 14.1640625, 17.46484375, 20.765625, 24.06640625, 27.3671875, 30.66796875, 33.96875, 37.26953125, 40.5703125, 43.87109375, 47.171875, 50.47265625, 53.7734375, 57.07421875, 60.375, 63.67578125, 66.9765625, 70.27734375, 73.578125, 76.87890625, 80.1796875, 83.48046875, 86.78125, 90.08203125, 93.3828125, 96.68359375, 99.984375, 103.28515625, 106.5859375, 109.88671875, 113.1875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 10.0, 22.0, 68.0, 126.0, 263.0, 267.0, 138.0, 56.0, 25.0, 11.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2293.167724609375, -2232.886474609375, -2172.60546875, -2112.32421875, -2052.04296875, -1991.7618408203125, -1931.480712890625, -1871.199462890625, -1810.9183349609375, -1750.63720703125, -1690.35595703125, -1630.0748291015625, -1569.793701171875, -1509.512451171875, -1449.2313232421875, -1388.9501953125, -1328.6689453125, -1268.3878173828125, -1208.1065673828125, -1147.825439453125, -1087.544189453125, -1027.2630615234375, -966.98193359375, -906.7007446289062, -846.4195556640625, -786.1383666992188, -725.857177734375, -665.5760498046875, -605.2948608398438, -545.013671875, -484.7325134277344, -424.45135498046875, -364.170166015625, -303.88897705078125, -243.60781860351562, -183.32664489746094, -123.04547119140625, -62.7642822265625, -2.483123779296875, 57.79803466796875, 118.0792236328125, 178.3603973388672, 238.64157104492188, 298.9227294921875, 359.20391845703125, 419.485107421875, 479.7662658691406, 540.0474243164062, 600.32861328125, 660.6098022460938, 720.8909912109375, 781.172119140625, 841.4533081054688, 901.7344970703125, 962.015625, 1022.2968139648438, 1082.5780029296875, 1142.859130859375, 1203.140380859375, 1263.4215087890625, 1323.70263671875, 1383.98388671875, 1444.2650146484375, 1504.546142578125, 1564.827392578125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 9.0, 7.0, 13.0, 17.0, 18.0, 21.0, 31.0, 24.0, 28.0, 31.0, 44.0, 45.0, 42.0, 62.0, 72.0, 52.0, 54.0, 69.0, 57.0, 43.0, 44.0, 33.0, 39.0, 29.0, 17.0, 16.0, 20.0, 14.0, 8.0, 11.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-727.3292846679688, -705.3887939453125, -683.4483032226562, -661.5078125, -639.5673217773438, -617.6268310546875, -595.6864013671875, -573.745849609375, -551.805419921875, -529.8649291992188, -507.9244384765625, -485.98394775390625, -464.04345703125, -442.10296630859375, -420.1625061035156, -398.2220153808594, -376.281494140625, -354.34100341796875, -332.4005126953125, -310.46002197265625, -288.51953125, -266.57904052734375, -244.63858032226562, -222.69808959960938, -200.75759887695312, -178.81710815429688, -156.87661743164062, -134.93614196777344, -112.99565124511719, -91.05516052246094, -69.11468505859375, -47.1741943359375, -25.233642578125, -3.2931556701660156, 18.64733123779297, 40.58781433105469, 62.52830505371094, 84.46879577636719, 106.40927124023438, 128.34976196289062, 150.29025268554688, 172.23074340820312, 194.17123413085938, 216.11170959472656, 238.0522003173828, 259.99267578125, 281.93316650390625, 303.8736572265625, 325.81414794921875, 347.754638671875, 369.69512939453125, 391.6356201171875, 413.57611083984375, 435.5166015625, 457.4570617675781, 479.3975524902344, 501.3380432128906, 523.2785034179688, 545.218994140625, 567.1594848632812, 589.0999755859375, 611.0404663085938, 632.98095703125, 654.9214477539062, 676.8619384765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 10.0, 3.0, 9.0, 14.0, 13.0, 32.0, 29.0, 46.0, 88.0, 131.0, 179.0, 288.0, 493.0, 777.0, 1642.0, 4863.0, 4140662.0, 38566.0, 3239.0, 1299.0, 640.0, 418.0, 257.0, 166.0, 108.0, 77.0, 58.0, 36.0, 27.0, 23.0, 20.0, 18.0, 14.0, 9.0, 5.0, 4.0, 7.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-315.25, -306.703125, -298.15625, -289.609375, -281.0625, -272.515625, -263.96875, -255.421875, -246.875, -238.328125, -229.78125, -221.234375, -212.6875, -204.140625, -195.59375, -187.046875, -178.5, -169.953125, -161.40625, -152.859375, -144.3125, -135.765625, -127.21875, -118.671875, -110.125, -101.578125, -93.03125, -84.484375, -75.9375, -67.390625, -58.84375, -50.296875, -41.75, -33.203125, -24.65625, -16.109375, -7.5625, 0.984375, 9.53125, 18.078125, 26.625, 35.171875, 43.71875, 52.265625, 60.8125, 69.359375, 77.90625, 86.453125, 95.0, 103.546875, 112.09375, 120.640625, 129.1875, 137.734375, 146.28125, 154.828125, 163.375, 171.921875, 180.46875, 189.015625, 197.5625, 206.109375, 214.65625, 223.203125, 231.75]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 7.0, 2.0, 3.0, 5.0, 4.0, 6.0, 8.0, 15.0, 13.0, 36.0, 22.0, 36.0, 41.0, 50.0, 50.0, 49.0, 60.0, 65.0, 62.0, 76.0, 56.0, 61.0, 54.0, 46.0, 43.0, 27.0, 18.0, 22.0, 16.0, 15.0, 10.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.234375, -28.30224609375, -27.3701171875, -26.43798828125, -25.505859375, -24.57373046875, -23.6416015625, -22.70947265625, -21.77734375, -20.84521484375, -19.9130859375, -18.98095703125, -18.048828125, -17.11669921875, -16.1845703125, -15.25244140625, -14.3203125, -13.38818359375, -12.4560546875, -11.52392578125, -10.591796875, -9.65966796875, -8.7275390625, -7.79541015625, -6.86328125, -5.93115234375, -4.9990234375, -4.06689453125, -3.134765625, -2.20263671875, -1.2705078125, -0.33837890625, 0.59375, 1.52587890625, 2.4580078125, 3.39013671875, 4.322265625, 5.25439453125, 6.1865234375, 7.11865234375, 8.05078125, 8.98291015625, 9.9150390625, 10.84716796875, 11.779296875, 12.71142578125, 13.6435546875, 14.57568359375, 15.5078125, 16.43994140625, 17.3720703125, 18.30419921875, 19.236328125, 20.16845703125, 21.1005859375, 22.03271484375, 22.96484375, 23.89697265625, 24.8291015625, 25.76123046875, 26.693359375, 27.62548828125, 28.5576171875, 29.48974609375, 30.421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 7.0, 3.0, 8.0, 13.0, 8.0, 12.0, 27.0, 34.0, 40.0, 69.0, 93.0, 135.0, 212.0, 305.0, 484.0, 881.0, 1669.0, 3755.0, 17030.0, 4136542.0, 24003.0, 4472.0, 1842.0, 980.0, 579.0, 354.0, 241.0, 142.0, 92.0, 67.0, 56.0, 30.0, 35.0, 18.0, 15.0, 4.0, 5.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-197.375, -191.978515625, -186.58203125, -181.185546875, -175.7890625, -170.392578125, -164.99609375, -159.599609375, -154.203125, -148.806640625, -143.41015625, -138.013671875, -132.6171875, -127.220703125, -121.82421875, -116.427734375, -111.03125, -105.634765625, -100.23828125, -94.841796875, -89.4453125, -84.048828125, -78.65234375, -73.255859375, -67.859375, -62.462890625, -57.06640625, -51.669921875, -46.2734375, -40.876953125, -35.48046875, -30.083984375, -24.6875, -19.291015625, -13.89453125, -8.498046875, -3.1015625, 2.294921875, 7.69140625, 13.087890625, 18.484375, 23.880859375, 29.27734375, 34.673828125, 40.0703125, 45.466796875, 50.86328125, 56.259765625, 61.65625, 67.052734375, 72.44921875, 77.845703125, 83.2421875, 88.638671875, 94.03515625, 99.431640625, 104.828125, 110.224609375, 115.62109375, 121.017578125, 126.4140625, 131.810546875, 137.20703125, 142.603515625, 148.0]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 18.0, 26.0, 106.0, 3840.0, 31.0, 16.0, 10.0, 5.0, 3.0, 8.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.90625, -26.7548828125, -25.603515625, -24.4521484375, -23.30078125, -22.1494140625, -20.998046875, -19.8466796875, -18.6953125, -17.5439453125, -16.392578125, -15.2412109375, -14.08984375, -12.9384765625, -11.787109375, -10.6357421875, -9.484375, -8.3330078125, -7.181640625, -6.0302734375, -4.87890625, -3.7275390625, -2.576171875, -1.4248046875, -0.2734375, 0.8779296875, 2.029296875, 3.1806640625, 4.33203125, 5.4833984375, 6.634765625, 7.7861328125, 8.9375, 10.0888671875, 11.240234375, 12.3916015625, 13.54296875, 14.6943359375, 15.845703125, 16.9970703125, 18.1484375, 19.2998046875, 20.451171875, 21.6025390625, 22.75390625, 23.9052734375, 25.056640625, 26.2080078125, 27.359375, 28.5107421875, 29.662109375, 30.8134765625, 31.96484375, 33.1162109375, 34.267578125, 35.4189453125, 36.5703125, 37.7216796875, 38.873046875, 40.0244140625, 41.17578125, 42.3271484375, 43.478515625, 44.6298828125, 45.78125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 9.0, 35.0, 69.0, 151.0, 242.0, 211.0, 120.0, 61.0, 43.0, 20.0, 13.0, 7.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-217.599853515625, -211.98501586914062, -206.37017822265625, -200.75534057617188, -195.1405029296875, -189.5256805419922, -183.9108428955078, -178.29600524902344, -172.68116760253906, -167.0663299560547, -161.4514923095703, -155.83665466308594, -150.22183227539062, -144.60699462890625, -138.99215698242188, -133.3773193359375, -127.76248168945312, -122.14764404296875, -116.53280639648438, -110.91797637939453, -105.30313873291016, -99.68830108642578, -94.07347106933594, -88.45863342285156, -82.84379577636719, -77.22895812988281, -71.61412048339844, -65.9992904663086, -60.38445281982422, -54.769615173339844, -49.154781341552734, -43.539947509765625, -37.92510986328125, -32.310272216796875, -26.695438385009766, -21.080602645874023, -15.465766906738281, -9.850931167602539, -4.236095428466797, 1.3787384033203125, 6.9935760498046875, 12.60841178894043, 18.223247528076172, 23.838083267211914, 29.452919006347656, 35.06775665283203, 40.68259048461914, 46.29742431640625, 51.912261962890625, 57.527099609375, 63.14193344116211, 68.75676727294922, 74.3716049194336, 79.98644256591797, 85.60127258300781, 91.21611022949219, 96.83094787597656, 102.44578552246094, 108.06062316894531, 113.67545318603516, 119.29029083251953, 124.9051284790039, 130.51995849609375, 136.13479614257812, 141.7496337890625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 5.0, 6.0, 13.0, 8.0, 12.0, 19.0, 19.0, 28.0, 22.0, 38.0, 24.0, 39.0, 35.0, 42.0, 42.0, 43.0, 52.0, 37.0, 36.0, 44.0, 50.0, 28.0, 37.0, 29.0, 31.0, 34.0, 35.0, 34.0, 18.0, 35.0, 19.0, 16.0, 13.0, 14.0, 16.0, 4.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.24619674682617, -49.57110595703125, -47.89601516723633, -46.220924377441406, -44.54583740234375, -42.87074279785156, -41.195655822753906, -39.520565032958984, -37.84547424316406, -36.17038345336914, -34.49529266357422, -32.8202018737793, -31.145112991333008, -29.470022201538086, -27.794933319091797, -26.119842529296875, -24.444751739501953, -22.76966094970703, -21.09457015991211, -19.41948127746582, -17.7443904876709, -16.069299697875977, -14.394209861755371, -12.719120025634766, -11.044029235839844, -9.368938446044922, -7.693848609924316, -6.018758296966553, -4.343667984008789, -2.668577194213867, -0.9934873580932617, 0.6816024780273438, 2.3566932678222656, 4.031783580780029, 5.706873893737793, 7.381964206695557, 9.05705451965332, 10.732145309448242, 12.407235145568848, 14.082324981689453, 15.757415771484375, 17.432506561279297, 19.10759735107422, 20.782686233520508, 22.45777702331543, 24.13286781311035, 25.80795669555664, 27.483047485351562, 29.158138275146484, 30.833229064941406, 32.50831985473633, 34.18341064453125, 35.858497619628906, 37.533592224121094, 39.20867919921875, 40.88376998901367, 42.558860778808594, 44.233951568603516, 45.90904235839844, 47.58413314819336, 49.25922393798828, 50.93431091308594, 52.60940170288086, 54.28449249267578, 55.9595832824707]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 9.0, 10.0, 22.0, 22.0, 48.0, 83.0, 104.0, 182.0, 343.0, 602.0, 1159.0, 2513.0, 5535.0, 14733.0, 43389.0, 157890.0, 497420.0, 231752.0, 60019.0, 19244.0, 7337.0, 3071.0, 1379.0, 709.0, 363.0, 225.0, 146.0, 84.0, 47.0, 27.0, 19.0, 25.0, 10.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-87.6875, -84.728515625, -81.76953125, -78.810546875, -75.8515625, -72.892578125, -69.93359375, -66.974609375, -64.015625, -61.056640625, -58.09765625, -55.138671875, -52.1796875, -49.220703125, -46.26171875, -43.302734375, -40.34375, -37.384765625, -34.42578125, -31.466796875, -28.5078125, -25.548828125, -22.58984375, -19.630859375, -16.671875, -13.712890625, -10.75390625, -7.794921875, -4.8359375, -1.876953125, 1.08203125, 4.041015625, 7.0, 9.958984375, 12.91796875, 15.876953125, 18.8359375, 21.794921875, 24.75390625, 27.712890625, 30.671875, 33.630859375, 36.58984375, 39.548828125, 42.5078125, 45.466796875, 48.42578125, 51.384765625, 54.34375, 57.302734375, 60.26171875, 63.220703125, 66.1796875, 69.138671875, 72.09765625, 75.056640625, 78.015625, 80.974609375, 83.93359375, 86.892578125, 89.8515625, 92.810546875, 95.76953125, 98.728515625, 101.6875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 4.0, 6.0, 10.0, 13.0, 11.0, 21.0, 22.0, 31.0, 40.0, 42.0, 47.0, 69.0, 48.0, 65.0, 56.0, 62.0, 69.0, 43.0, 55.0, 44.0, 33.0, 32.0, 34.0, 33.0, 20.0, 16.0, 14.0, 10.0, 7.0, 8.0, 5.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.65625, -27.733642578125, -26.81103515625, -25.888427734375, -24.9658203125, -24.043212890625, -23.12060546875, -22.197998046875, -21.275390625, -20.352783203125, -19.43017578125, -18.507568359375, -17.5849609375, -16.662353515625, -15.73974609375, -14.817138671875, -13.89453125, -12.971923828125, -12.04931640625, -11.126708984375, -10.2041015625, -9.281494140625, -8.35888671875, -7.436279296875, -6.513671875, -5.591064453125, -4.66845703125, -3.745849609375, -2.8232421875, -1.900634765625, -0.97802734375, -0.055419921875, 0.8671875, 1.789794921875, 2.71240234375, 3.635009765625, 4.5576171875, 5.480224609375, 6.40283203125, 7.325439453125, 8.248046875, 9.170654296875, 10.09326171875, 11.015869140625, 11.9384765625, 12.861083984375, 13.78369140625, 14.706298828125, 15.62890625, 16.551513671875, 17.47412109375, 18.396728515625, 19.3193359375, 20.241943359375, 21.16455078125, 22.087158203125, 23.009765625, 23.932373046875, 24.85498046875, 25.777587890625, 26.7001953125, 27.622802734375, 28.54541015625, 29.468017578125, 30.390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 7.0, 9.0, 6.0, 7.0, 9.0, 16.0, 35.0, 35.0, 49.0, 74.0, 110.0, 186.0, 316.0, 540.0, 1145.0, 3132.0, 13859.0, 156182.0, 793961.0, 66449.0, 8067.0, 2237.0, 897.0, 469.0, 250.0, 172.0, 93.0, 73.0, 48.0, 27.0, 27.0, 16.0, 24.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.5, -189.263671875, -183.02734375, -176.791015625, -170.5546875, -164.318359375, -158.08203125, -151.845703125, -145.609375, -139.373046875, -133.13671875, -126.900390625, -120.6640625, -114.427734375, -108.19140625, -101.955078125, -95.71875, -89.482421875, -83.24609375, -77.009765625, -70.7734375, -64.537109375, -58.30078125, -52.064453125, -45.828125, -39.591796875, -33.35546875, -27.119140625, -20.8828125, -14.646484375, -8.41015625, -2.173828125, 4.0625, 10.298828125, 16.53515625, 22.771484375, 29.0078125, 35.244140625, 41.48046875, 47.716796875, 53.953125, 60.189453125, 66.42578125, 72.662109375, 78.8984375, 85.134765625, 91.37109375, 97.607421875, 103.84375, 110.080078125, 116.31640625, 122.552734375, 128.7890625, 135.025390625, 141.26171875, 147.498046875, 153.734375, 159.970703125, 166.20703125, 172.443359375, 178.6796875, 184.916015625, 191.15234375, 197.388671875, 203.625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 11.0, 9.0, 12.0, 15.0, 15.0, 11.0, 19.0, 22.0, 29.0, 34.0, 32.0, 31.0, 52.0, 47.0, 50.0, 46.0, 41.0, 49.0, 49.0, 44.0, 41.0, 37.0, 43.0, 28.0, 34.0, 29.0, 31.0, 24.0, 18.0, 13.0, 16.0, 11.0, 11.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-130.5, -126.5693359375, -122.638671875, -118.7080078125, -114.77734375, -110.8466796875, -106.916015625, -102.9853515625, -99.0546875, -95.1240234375, -91.193359375, -87.2626953125, -83.33203125, -79.4013671875, -75.470703125, -71.5400390625, -67.609375, -63.6787109375, -59.748046875, -55.8173828125, -51.88671875, -47.9560546875, -44.025390625, -40.0947265625, -36.1640625, -32.2333984375, -28.302734375, -24.3720703125, -20.44140625, -16.5107421875, -12.580078125, -8.6494140625, -4.71875, -0.7880859375, 3.142578125, 7.0732421875, 11.00390625, 14.9345703125, 18.865234375, 22.7958984375, 26.7265625, 30.6572265625, 34.587890625, 38.5185546875, 42.44921875, 46.3798828125, 50.310546875, 54.2412109375, 58.171875, 62.1025390625, 66.033203125, 69.9638671875, 73.89453125, 77.8251953125, 81.755859375, 85.6865234375, 89.6171875, 93.5478515625, 97.478515625, 101.4091796875, 105.33984375, 109.2705078125, 113.201171875, 117.1318359375, 121.0625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 2.0, 9.0, 5.0, 10.0, 16.0, 12.0, 23.0, 34.0, 55.0, 69.0, 131.0, 272.0, 710.0, 2503.0, 20152.0, 990561.0, 29416.0, 3058.0, 797.0, 329.0, 150.0, 78.0, 52.0, 28.0, 21.0, 15.0, 14.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-279.75, -272.09765625, -264.4453125, -256.79296875, -249.140625, -241.48828125, -233.8359375, -226.18359375, -218.53125, -210.87890625, -203.2265625, -195.57421875, -187.921875, -180.26953125, -172.6171875, -164.96484375, -157.3125, -149.66015625, -142.0078125, -134.35546875, -126.703125, -119.05078125, -111.3984375, -103.74609375, -96.09375, -88.44140625, -80.7890625, -73.13671875, -65.484375, -57.83203125, -50.1796875, -42.52734375, -34.875, -27.22265625, -19.5703125, -11.91796875, -4.265625, 3.38671875, 11.0390625, 18.69140625, 26.34375, 33.99609375, 41.6484375, 49.30078125, 56.953125, 64.60546875, 72.2578125, 79.91015625, 87.5625, 95.21484375, 102.8671875, 110.51953125, 118.171875, 125.82421875, 133.4765625, 141.12890625, 148.78125, 156.43359375, 164.0859375, 171.73828125, 179.390625, 187.04296875, 194.6953125, 202.34765625, 210.0]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 12.0, 11.0, 12.0, 19.0, 44.0, 60.0, 132.0, 177.0, 203.0, 127.0, 68.0, 56.0, 29.0, 17.0, 15.0, 9.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0268402099609375, -0.026257991790771484, -0.02567577362060547, -0.025093555450439453, -0.024511337280273438, -0.023929119110107422, -0.023346900939941406, -0.02276468276977539, -0.022182464599609375, -0.02160024642944336, -0.021018028259277344, -0.020435810089111328, -0.019853591918945312, -0.019271373748779297, -0.01868915557861328, -0.018106937408447266, -0.01752471923828125, -0.016942501068115234, -0.01636028289794922, -0.015778064727783203, -0.015195846557617188, -0.014613628387451172, -0.014031410217285156, -0.01344919204711914, -0.012866973876953125, -0.01228475570678711, -0.011702537536621094, -0.011120319366455078, -0.010538101196289062, -0.009955883026123047, -0.009373664855957031, -0.008791446685791016, -0.008209228515625, -0.007627010345458984, -0.007044792175292969, -0.006462574005126953, -0.0058803558349609375, -0.005298137664794922, -0.004715919494628906, -0.004133701324462891, -0.003551483154296875, -0.0029692649841308594, -0.0023870468139648438, -0.0018048286437988281, -0.0012226104736328125, -0.0006403923034667969, -5.817413330078125e-05, 0.0005240440368652344, 0.00110626220703125, 0.0016884803771972656, 0.0022706985473632812, 0.002852916717529297, 0.0034351348876953125, 0.004017353057861328, 0.004599571228027344, 0.005181789398193359, 0.005764007568359375, 0.006346225738525391, 0.006928443908691406, 0.007510662078857422, 0.008092880249023438, 0.008675098419189453, 0.009257316589355469, 0.009839534759521484, 0.0104217529296875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 2.0, 8.0, 23.0, 26.0, 38.0, 55.0, 140.0, 280.0, 777.0, 3662.0, 65608.0, 964008.0, 11440.0, 1623.0, 453.0, 174.0, 94.0, 44.0, 36.0, 23.0, 10.0, 8.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.25, -259.447265625, -251.64453125, -243.841796875, -236.0390625, -228.236328125, -220.43359375, -212.630859375, -204.828125, -197.025390625, -189.22265625, -181.419921875, -173.6171875, -165.814453125, -158.01171875, -150.208984375, -142.40625, -134.603515625, -126.80078125, -118.998046875, -111.1953125, -103.392578125, -95.58984375, -87.787109375, -79.984375, -72.181640625, -64.37890625, -56.576171875, -48.7734375, -40.970703125, -33.16796875, -25.365234375, -17.5625, -9.759765625, -1.95703125, 5.845703125, 13.6484375, 21.451171875, 29.25390625, 37.056640625, 44.859375, 52.662109375, 60.46484375, 68.267578125, 76.0703125, 83.873046875, 91.67578125, 99.478515625, 107.28125, 115.083984375, 122.88671875, 130.689453125, 138.4921875, 146.294921875, 154.09765625, 161.900390625, 169.703125, 177.505859375, 185.30859375, 193.111328125, 200.9140625, 208.716796875, 216.51953125, 224.322265625, 232.125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 4.0, 2.0, 7.0, 5.0, 13.0, 18.0, 31.0, 85.0, 277.0, 332.0, 132.0, 44.0, 16.0, 11.0, 6.0, 4.0, 4.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.75, -270.662109375, -263.57421875, -256.486328125, -249.3984375, -242.310546875, -235.22265625, -228.134765625, -221.046875, -213.958984375, -206.87109375, -199.783203125, -192.6953125, -185.607421875, -178.51953125, -171.431640625, -164.34375, -157.255859375, -150.16796875, -143.080078125, -135.9921875, -128.904296875, -121.81640625, -114.728515625, -107.640625, -100.552734375, -93.46484375, -86.376953125, -79.2890625, -72.201171875, -65.11328125, -58.025390625, -50.9375, -43.849609375, -36.76171875, -29.673828125, -22.5859375, -15.498046875, -8.41015625, -1.322265625, 5.765625, 12.853515625, 19.94140625, 27.029296875, 34.1171875, 41.205078125, 48.29296875, 55.380859375, 62.46875, 69.556640625, 76.64453125, 83.732421875, 90.8203125, 97.908203125, 104.99609375, 112.083984375, 119.171875, 126.259765625, 133.34765625, 140.435546875, 147.5234375, 154.611328125, 161.69921875, 168.787109375, 175.875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 5.0, 18.0, 76.0, 201.0, 345.0, 221.0, 96.0, 25.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2381.22802734375, -2300.16357421875, -2219.09912109375, -2138.03466796875, -2056.97021484375, -1975.9056396484375, -1894.841064453125, -1813.776611328125, -1732.712158203125, -1651.647705078125, -1570.583251953125, -1489.5186767578125, -1408.4542236328125, -1327.3897705078125, -1246.3251953125, -1165.2607421875, -1084.1962890625, -1003.1318359375, -922.0673217773438, -841.0028076171875, -759.9383544921875, -678.8739013671875, -597.8093872070312, -516.744873046875, -435.680419921875, -354.6159362792969, -273.55145263671875, -192.48696899414062, -111.4224853515625, -30.358001708984375, 50.70648193359375, 131.77099609375, 212.83544921875, 293.8999328613281, 374.96441650390625, 456.0289001464844, 537.0933837890625, 618.1578369140625, 699.2223510742188, 780.286865234375, 861.351318359375, 942.415771484375, 1023.4802856445312, 1104.5447998046875, 1185.6092529296875, 1266.6737060546875, 1347.73828125, 1428.802734375, 1509.8671875, 1590.931640625, 1671.99609375, 1753.0606689453125, 1834.1251220703125, 1915.1895751953125, 1996.254150390625, 2077.318603515625, 2158.383056640625, 2239.447509765625, 2320.511962890625, 2401.576416015625, 2482.64111328125, 2563.70556640625, 2644.77001953125, 2725.83447265625, 2806.89892578125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 11.0, 8.0, 10.0, 14.0, 8.0, 16.0, 24.0, 34.0, 28.0, 44.0, 39.0, 43.0, 48.0, 49.0, 68.0, 54.0, 61.0, 60.0, 58.0, 46.0, 37.0, 45.0, 29.0, 27.0, 28.0, 29.0, 25.0, 16.0, 7.0, 10.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-625.2022705078125, -599.27099609375, -573.3397216796875, -547.408447265625, -521.4771728515625, -495.5458984375, -469.6146240234375, -443.683349609375, -417.7520751953125, -391.82080078125, -365.8895263671875, -339.958251953125, -314.0269775390625, -288.095703125, -262.1644287109375, -236.233154296875, -210.3018798828125, -184.37060546875, -158.4393310546875, -132.508056640625, -106.5767822265625, -80.6455078125, -54.7142333984375, -28.782958984375, -2.8516845703125, 23.07958984375, 49.0108642578125, 74.942138671875, 100.8734130859375, 126.8046875, 152.7359619140625, 178.667236328125, 204.5985107421875, 230.52978515625, 256.4610595703125, 282.392333984375, 308.3236083984375, 334.2548828125, 360.1861572265625, 386.117431640625, 412.0487060546875, 437.97998046875, 463.9112548828125, 489.842529296875, 515.7738037109375, 541.705078125, 567.6363525390625, 593.567626953125, 619.4989013671875, 645.43017578125, 671.3614501953125, 697.292724609375, 723.2239990234375, 749.1552734375, 775.0865478515625, 801.017822265625, 826.9490966796875, 852.88037109375, 878.8116455078125, 904.742919921875, 930.6741943359375, 956.60546875, 982.5367431640625, 1008.468017578125, 1034.3992919921875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 4.0, 7.0, 8.0, 10.0, 15.0, 16.0, 20.0, 35.0, 42.0, 66.0, 112.0, 153.0, 272.0, 421.0, 726.0, 1614.0, 5567.0, 88719.0, 4083208.0, 8932.0, 2036.0, 902.0, 482.0, 299.0, 169.0, 128.0, 98.0, 54.0, 42.0, 34.0, 11.0, 18.0, 12.0, 7.0, 12.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-183.125, -177.048828125, -170.97265625, -164.896484375, -158.8203125, -152.744140625, -146.66796875, -140.591796875, -134.515625, -128.439453125, -122.36328125, -116.287109375, -110.2109375, -104.134765625, -98.05859375, -91.982421875, -85.90625, -79.830078125, -73.75390625, -67.677734375, -61.6015625, -55.525390625, -49.44921875, -43.373046875, -37.296875, -31.220703125, -25.14453125, -19.068359375, -12.9921875, -6.916015625, -0.83984375, 5.236328125, 11.3125, 17.388671875, 23.46484375, 29.541015625, 35.6171875, 41.693359375, 47.76953125, 53.845703125, 59.921875, 65.998046875, 72.07421875, 78.150390625, 84.2265625, 90.302734375, 96.37890625, 102.455078125, 108.53125, 114.607421875, 120.68359375, 126.759765625, 132.8359375, 138.912109375, 144.98828125, 151.064453125, 157.140625, 163.216796875, 169.29296875, 175.369140625, 181.4453125, 187.521484375, 193.59765625, 199.673828125, 205.75]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 14.0, 20.0, 19.0, 33.0, 47.0, 66.0, 100.0, 97.0, 108.0, 103.0, 98.0, 86.0, 67.0, 42.0, 24.0, 24.0, 20.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.96875, -50.177734375, -48.38671875, -46.595703125, -44.8046875, -43.013671875, -41.22265625, -39.431640625, -37.640625, -35.849609375, -34.05859375, -32.267578125, -30.4765625, -28.685546875, -26.89453125, -25.103515625, -23.3125, -21.521484375, -19.73046875, -17.939453125, -16.1484375, -14.357421875, -12.56640625, -10.775390625, -8.984375, -7.193359375, -5.40234375, -3.611328125, -1.8203125, -0.029296875, 1.76171875, 3.552734375, 5.34375, 7.134765625, 8.92578125, 10.716796875, 12.5078125, 14.298828125, 16.08984375, 17.880859375, 19.671875, 21.462890625, 23.25390625, 25.044921875, 26.8359375, 28.626953125, 30.41796875, 32.208984375, 34.0, 35.791015625, 37.58203125, 39.373046875, 41.1640625, 42.955078125, 44.74609375, 46.537109375, 48.328125, 50.119140625, 51.91015625, 53.701171875, 55.4921875, 57.283203125, 59.07421875, 60.865234375, 62.65625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 12.0, 19.0, 27.0, 35.0, 52.0, 81.0, 116.0, 157.0, 259.0, 421.0, 686.0, 1373.0, 3461.0, 14406.0, 4095882.0, 66413.0, 6274.0, 2062.0, 985.0, 539.0, 329.0, 211.0, 148.0, 96.0, 72.0, 45.0, 31.0, 21.0, 14.0, 11.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-324.0, -315.638671875, -307.27734375, -298.916015625, -290.5546875, -282.193359375, -273.83203125, -265.470703125, -257.109375, -248.748046875, -240.38671875, -232.025390625, -223.6640625, -215.302734375, -206.94140625, -198.580078125, -190.21875, -181.857421875, -173.49609375, -165.134765625, -156.7734375, -148.412109375, -140.05078125, -131.689453125, -123.328125, -114.966796875, -106.60546875, -98.244140625, -89.8828125, -81.521484375, -73.16015625, -64.798828125, -56.4375, -48.076171875, -39.71484375, -31.353515625, -22.9921875, -14.630859375, -6.26953125, 2.091796875, 10.453125, 18.814453125, 27.17578125, 35.537109375, 43.8984375, 52.259765625, 60.62109375, 68.982421875, 77.34375, 85.705078125, 94.06640625, 102.427734375, 110.7890625, 119.150390625, 127.51171875, 135.873046875, 144.234375, 152.595703125, 160.95703125, 169.318359375, 177.6796875, 186.041015625, 194.40234375, 202.763671875, 211.125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 9.0, 5.0, 15.0, 48.0, 476.0, 3371.0, 91.0, 26.0, 11.0, 7.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.75, -77.09375, -73.4375, -69.78125, -66.125, -62.46875, -58.8125, -55.15625, -51.5, -47.84375, -44.1875, -40.53125, -36.875, -33.21875, -29.5625, -25.90625, -22.25, -18.59375, -14.9375, -11.28125, -7.625, -3.96875, -0.3125, 3.34375, 7.0, 10.65625, 14.3125, 17.96875, 21.625, 25.28125, 28.9375, 32.59375, 36.25, 39.90625, 43.5625, 47.21875, 50.875, 54.53125, 58.1875, 61.84375, 65.5, 69.15625, 72.8125, 76.46875, 80.125, 83.78125, 87.4375, 91.09375, 94.75, 98.40625, 102.0625, 105.71875, 109.375, 113.03125, 116.6875, 120.34375, 124.0, 127.65625, 131.3125, 134.96875, 138.625, 142.28125, 145.9375, 149.59375, 153.25]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 7.0, 8.0, 18.0, 42.0, 74.0, 147.0, 219.0, 186.0, 124.0, 74.0, 37.0, 23.0, 11.0, 6.0, 13.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.9931182861328, -206.54884338378906, -190.10455322265625, -173.6602783203125, -157.21600341796875, -140.771728515625, -124.32744598388672, -107.88316345214844, -91.43888854980469, -74.99461364746094, -58.550331115722656, -42.10605239868164, -25.661773681640625, -9.217498779296875, 7.226783752441406, 23.671066284179688, 40.11534118652344, 56.55961990356445, 73.00389862060547, 89.44818115234375, 105.8924560546875, 122.33673095703125, 138.781005859375, 155.2252960205078, 171.66957092285156, 188.1138458251953, 204.55813598632812, 221.00241088867188, 237.44668579101562, 253.89096069335938, 270.3352355957031, 286.779541015625, 303.22381591796875, 319.6680908203125, 336.11236572265625, 352.556640625, 369.00091552734375, 385.4451904296875, 401.8894958496094, 418.3337707519531, 434.7780456542969, 451.2223205566406, 467.6665954589844, 484.1108703613281, 500.55517578125, 516.9994506835938, 533.4437255859375, 549.8880004882812, 566.332275390625, 582.7765502929688, 599.2208251953125, 615.6651000976562, 632.109375, 648.5536499023438, 664.9979248046875, 681.4422607421875, 697.886474609375, 714.3307495117188, 730.7750244140625, 747.2192993164062, 763.66357421875, 780.1078491210938, 796.5521240234375, 812.9964599609375, 829.4407348632812]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 10.0, 7.0, 5.0, 10.0, 7.0, 20.0, 13.0, 14.0, 23.0, 24.0, 30.0, 24.0, 28.0, 28.0, 47.0, 40.0, 50.0, 37.0, 42.0, 37.0, 41.0, 54.0, 32.0, 37.0, 57.0, 25.0, 41.0, 33.0, 27.0, 27.0, 18.0, 18.0, 19.0, 16.0, 13.0, 7.0, 11.0, 8.0, 7.0, 0.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-197.54888916015625, -190.67176818847656, -183.79466247558594, -176.91754150390625, -170.04043579101562, -163.16331481933594, -156.28619384765625, -149.40908813476562, -142.53196716308594, -135.65484619140625, -128.77774047851562, -121.90061950683594, -115.02350616455078, -108.14639282226562, -101.26927185058594, -94.39215850830078, -87.51504516601562, -80.63793182373047, -73.76081848144531, -66.88369750976562, -60.00658416748047, -53.12947082519531, -46.25235366821289, -39.37523651123047, -32.49812316894531, -25.621007919311523, -18.743892669677734, -11.866777420043945, -4.989662170410156, 1.887451171875, 8.764568328857422, 15.641685485839844, 22.518798828125, 29.39591407775879, 36.27302932739258, 43.150146484375, 50.027259826660156, 56.90437316894531, 63.781490325927734, 70.65860748291016, 77.53572082519531, 84.41283416748047, 91.28994750976562, 98.16706848144531, 105.04418182373047, 111.92129516601562, 118.79841613769531, 125.67552947998047, 132.55264282226562, 139.4297637939453, 146.30686950683594, 153.18399047851562, 160.06109619140625, 166.93821716308594, 173.81533813476562, 180.69244384765625, 187.56956481933594, 194.44668579101562, 201.32379150390625, 208.20091247558594, 215.07803344726562, 221.95513916015625, 228.83226013183594, 235.70938110351562, 242.58648681640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 5.0, 10.0, 21.0, 15.0, 26.0, 42.0, 63.0, 73.0, 135.0, 205.0, 311.0, 482.0, 860.0, 1501.0, 2709.0, 5244.0, 11004.0, 26173.0, 72945.0, 255582.0, 450583.0, 140997.0, 45178.0, 17676.0, 7932.0, 3790.0, 2056.0, 1128.0, 682.0, 360.0, 260.0, 176.0, 115.0, 68.0, 36.0, 25.0, 17.0, 19.0, 10.0, 14.0, 4.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-119.5625, -116.07421875, -112.5859375, -109.09765625, -105.609375, -102.12109375, -98.6328125, -95.14453125, -91.65625, -88.16796875, -84.6796875, -81.19140625, -77.703125, -74.21484375, -70.7265625, -67.23828125, -63.75, -60.26171875, -56.7734375, -53.28515625, -49.796875, -46.30859375, -42.8203125, -39.33203125, -35.84375, -32.35546875, -28.8671875, -25.37890625, -21.890625, -18.40234375, -14.9140625, -11.42578125, -7.9375, -4.44921875, -0.9609375, 2.52734375, 6.015625, 9.50390625, 12.9921875, 16.48046875, 19.96875, 23.45703125, 26.9453125, 30.43359375, 33.921875, 37.41015625, 40.8984375, 44.38671875, 47.875, 51.36328125, 54.8515625, 58.33984375, 61.828125, 65.31640625, 68.8046875, 72.29296875, 75.78125, 79.26953125, 82.7578125, 86.24609375, 89.734375, 93.22265625, 96.7109375, 100.19921875, 103.6875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 8.0, 12.0, 23.0, 13.0, 22.0, 37.0, 36.0, 43.0, 56.0, 60.0, 75.0, 60.0, 65.0, 65.0, 58.0, 57.0, 47.0, 39.0, 41.0, 36.0, 27.0, 18.0, 15.0, 21.0, 5.0, 8.0, 7.0, 8.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.6875, -43.2353515625, -41.783203125, -40.3310546875, -38.87890625, -37.4267578125, -35.974609375, -34.5224609375, -33.0703125, -31.6181640625, -30.166015625, -28.7138671875, -27.26171875, -25.8095703125, -24.357421875, -22.9052734375, -21.453125, -20.0009765625, -18.548828125, -17.0966796875, -15.64453125, -14.1923828125, -12.740234375, -11.2880859375, -9.8359375, -8.3837890625, -6.931640625, -5.4794921875, -4.02734375, -2.5751953125, -1.123046875, 0.3291015625, 1.78125, 3.2333984375, 4.685546875, 6.1376953125, 7.58984375, 9.0419921875, 10.494140625, 11.9462890625, 13.3984375, 14.8505859375, 16.302734375, 17.7548828125, 19.20703125, 20.6591796875, 22.111328125, 23.5634765625, 25.015625, 26.4677734375, 27.919921875, 29.3720703125, 30.82421875, 32.2763671875, 33.728515625, 35.1806640625, 36.6328125, 38.0849609375, 39.537109375, 40.9892578125, 42.44140625, 43.8935546875, 45.345703125, 46.7978515625, 48.25]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 13.0, 9.0, 17.0, 20.0, 37.0, 61.0, 73.0, 113.0, 178.0, 305.0, 527.0, 999.0, 2266.0, 6469.0, 26942.0, 249889.0, 681976.0, 60775.0, 11331.0, 3478.0, 1377.0, 692.0, 372.0, 204.0, 103.0, 98.0, 61.0, 52.0, 28.0, 24.0, 17.0, 12.0, 9.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-242.5, -235.412109375, -228.32421875, -221.236328125, -214.1484375, -207.060546875, -199.97265625, -192.884765625, -185.796875, -178.708984375, -171.62109375, -164.533203125, -157.4453125, -150.357421875, -143.26953125, -136.181640625, -129.09375, -122.005859375, -114.91796875, -107.830078125, -100.7421875, -93.654296875, -86.56640625, -79.478515625, -72.390625, -65.302734375, -58.21484375, -51.126953125, -44.0390625, -36.951171875, -29.86328125, -22.775390625, -15.6875, -8.599609375, -1.51171875, 5.576171875, 12.6640625, 19.751953125, 26.83984375, 33.927734375, 41.015625, 48.103515625, 55.19140625, 62.279296875, 69.3671875, 76.455078125, 83.54296875, 90.630859375, 97.71875, 104.806640625, 111.89453125, 118.982421875, 126.0703125, 133.158203125, 140.24609375, 147.333984375, 154.421875, 161.509765625, 168.59765625, 175.685546875, 182.7734375, 189.861328125, 196.94921875, 204.037109375, 211.125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 4.0, 6.0, 8.0, 14.0, 7.0, 11.0, 18.0, 22.0, 21.0, 34.0, 38.0, 31.0, 45.0, 50.0, 44.0, 49.0, 57.0, 64.0, 39.0, 64.0, 66.0, 50.0, 33.0, 46.0, 26.0, 24.0, 25.0, 18.0, 15.0, 15.0, 12.0, 12.0, 7.0, 11.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.25, -200.208984375, -193.16796875, -186.126953125, -179.0859375, -172.044921875, -165.00390625, -157.962890625, -150.921875, -143.880859375, -136.83984375, -129.798828125, -122.7578125, -115.716796875, -108.67578125, -101.634765625, -94.59375, -87.552734375, -80.51171875, -73.470703125, -66.4296875, -59.388671875, -52.34765625, -45.306640625, -38.265625, -31.224609375, -24.18359375, -17.142578125, -10.1015625, -3.060546875, 3.98046875, 11.021484375, 18.0625, 25.103515625, 32.14453125, 39.185546875, 46.2265625, 53.267578125, 60.30859375, 67.349609375, 74.390625, 81.431640625, 88.47265625, 95.513671875, 102.5546875, 109.595703125, 116.63671875, 123.677734375, 130.71875, 137.759765625, 144.80078125, 151.841796875, 158.8828125, 165.923828125, 172.96484375, 180.005859375, 187.046875, 194.087890625, 201.12890625, 208.169921875, 215.2109375, 222.251953125, 229.29296875, 236.333984375, 243.375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 1.0, 3.0, 4.0, 8.0, 15.0, 12.0, 26.0, 36.0, 57.0, 74.0, 131.0, 224.0, 536.0, 1524.0, 8020.0, 337366.0, 687427.0, 10080.0, 1742.0, 624.0, 237.0, 144.0, 66.0, 48.0, 33.0, 31.0, 21.0, 7.0, 12.0, 10.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-228.625, -221.70703125, -214.7890625, -207.87109375, -200.953125, -194.03515625, -187.1171875, -180.19921875, -173.28125, -166.36328125, -159.4453125, -152.52734375, -145.609375, -138.69140625, -131.7734375, -124.85546875, -117.9375, -111.01953125, -104.1015625, -97.18359375, -90.265625, -83.34765625, -76.4296875, -69.51171875, -62.59375, -55.67578125, -48.7578125, -41.83984375, -34.921875, -28.00390625, -21.0859375, -14.16796875, -7.25, -0.33203125, 6.5859375, 13.50390625, 20.421875, 27.33984375, 34.2578125, 41.17578125, 48.09375, 55.01171875, 61.9296875, 68.84765625, 75.765625, 82.68359375, 89.6015625, 96.51953125, 103.4375, 110.35546875, 117.2734375, 124.19140625, 131.109375, 138.02734375, 144.9453125, 151.86328125, 158.78125, 165.69921875, 172.6171875, 179.53515625, 186.453125, 193.37109375, 200.2890625, 207.20703125, 214.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 6.0, 8.0, 13.0, 20.0, 21.0, 32.0, 55.0, 84.0, 127.0, 161.0, 127.0, 120.0, 63.0, 40.0, 38.0, 15.0, 18.0, 9.0, 6.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0159454345703125, -0.015372514724731445, -0.01479959487915039, -0.014226675033569336, -0.013653755187988281, -0.013080835342407227, -0.012507915496826172, -0.011934995651245117, -0.011362075805664062, -0.010789155960083008, -0.010216236114501953, -0.009643316268920898, -0.009070396423339844, -0.008497476577758789, -0.007924556732177734, -0.00735163688659668, -0.006778717041015625, -0.00620579719543457, -0.005632877349853516, -0.005059957504272461, -0.004487037658691406, -0.0039141178131103516, -0.003341197967529297, -0.002768278121948242, -0.0021953582763671875, -0.0016224384307861328, -0.0010495185852050781, -0.00047659873962402344, 9.632110595703125e-05, 0.0006692409515380859, 0.0012421607971191406, 0.0018150806427001953, 0.00238800048828125, 0.0029609203338623047, 0.0035338401794433594, 0.004106760025024414, 0.004679679870605469, 0.0052525997161865234, 0.005825519561767578, 0.006398439407348633, 0.0069713592529296875, 0.007544279098510742, 0.008117198944091797, 0.008690118789672852, 0.009263038635253906, 0.009835958480834961, 0.010408878326416016, 0.01098179817199707, 0.011554718017578125, 0.01212763786315918, 0.012700557708740234, 0.013273477554321289, 0.013846397399902344, 0.014419317245483398, 0.014992237091064453, 0.015565156936645508, 0.016138076782226562, 0.016710996627807617, 0.017283916473388672, 0.017856836318969727, 0.01842975616455078, 0.019002676010131836, 0.01957559585571289, 0.020148515701293945, 0.020721435546875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 12.0, 13.0, 12.0, 21.0, 21.0, 39.0, 73.0, 74.0, 114.0, 189.0, 355.0, 617.0, 1258.0, 2940.0, 8439.0, 47837.0, 915609.0, 55924.0, 9074.0, 3010.0, 1325.0, 618.0, 351.0, 219.0, 121.0, 82.0, 63.0, 43.0, 36.0, 9.0, 15.0, 8.0, 7.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-166.875, -161.025390625, -155.17578125, -149.326171875, -143.4765625, -137.626953125, -131.77734375, -125.927734375, -120.078125, -114.228515625, -108.37890625, -102.529296875, -96.6796875, -90.830078125, -84.98046875, -79.130859375, -73.28125, -67.431640625, -61.58203125, -55.732421875, -49.8828125, -44.033203125, -38.18359375, -32.333984375, -26.484375, -20.634765625, -14.78515625, -8.935546875, -3.0859375, 2.763671875, 8.61328125, 14.462890625, 20.3125, 26.162109375, 32.01171875, 37.861328125, 43.7109375, 49.560546875, 55.41015625, 61.259765625, 67.109375, 72.958984375, 78.80859375, 84.658203125, 90.5078125, 96.357421875, 102.20703125, 108.056640625, 113.90625, 119.755859375, 125.60546875, 131.455078125, 137.3046875, 143.154296875, 149.00390625, 154.853515625, 160.703125, 166.552734375, 172.40234375, 178.251953125, 184.1015625, 189.951171875, 195.80078125, 201.650390625, 207.5]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 5.0, 0.0, 2.0, 6.0, 12.0, 12.0, 16.0, 55.0, 133.0, 297.0, 255.0, 113.0, 44.0, 20.0, 12.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-311.0, -302.568359375, -294.13671875, -285.705078125, -277.2734375, -268.841796875, -260.41015625, -251.978515625, -243.546875, -235.115234375, -226.68359375, -218.251953125, -209.8203125, -201.388671875, -192.95703125, -184.525390625, -176.09375, -167.662109375, -159.23046875, -150.798828125, -142.3671875, -133.935546875, -125.50390625, -117.072265625, -108.640625, -100.208984375, -91.77734375, -83.345703125, -74.9140625, -66.482421875, -58.05078125, -49.619140625, -41.1875, -32.755859375, -24.32421875, -15.892578125, -7.4609375, 0.970703125, 9.40234375, 17.833984375, 26.265625, 34.697265625, 43.12890625, 51.560546875, 59.9921875, 68.423828125, 76.85546875, 85.287109375, 93.71875, 102.150390625, 110.58203125, 119.013671875, 127.4453125, 135.876953125, 144.30859375, 152.740234375, 161.171875, 169.603515625, 178.03515625, 186.466796875, 194.8984375, 203.330078125, 211.76171875, 220.193359375, 228.625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 13.0, 50.0, 348.0, 492.0, 74.0, 13.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5615.1923828125, -5415.76611328125, -5216.33935546875, -5016.9130859375, -4817.486328125, -4618.06005859375, -4418.6337890625, -4219.20703125, -4019.78076171875, -3820.354248046875, -3620.927734375, -3421.50146484375, -3222.074951171875, -3022.6484375, -2823.22216796875, -2623.795654296875, -2424.369140625, -2224.942626953125, -2025.5162353515625, -1826.08984375, -1626.663330078125, -1427.23681640625, -1227.8104248046875, -1028.384033203125, -828.95751953125, -629.5310668945312, -430.1046142578125, -230.67816162109375, -31.251708984375, 168.17474365234375, 367.6011962890625, 567.027587890625, 766.45458984375, 965.8810424804688, 1165.3074951171875, 1364.73388671875, 1564.160400390625, 1763.5869140625, 1963.0133056640625, 2162.439697265625, 2361.8662109375, 2561.292724609375, 2760.71923828125, 2960.1455078125, 3159.572021484375, 3358.99853515625, 3558.4248046875, 3757.851318359375, 3957.27783203125, 4156.7041015625, 4356.130859375, 4555.55712890625, 4754.9833984375, 4954.41015625, 5153.83642578125, 5353.2626953125, 5552.689453125, 5752.11572265625, 5951.54248046875, 6150.96875, 6350.3955078125, 6549.82177734375, 6749.248046875, 6948.6748046875, 7148.10107421875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 9.0, 4.0, 6.0, 11.0, 9.0, 16.0, 20.0, 16.0, 30.0, 47.0, 41.0, 36.0, 49.0, 60.0, 69.0, 49.0, 75.0, 56.0, 63.0, 47.0, 46.0, 43.0, 39.0, 32.0, 36.0, 20.0, 27.0, 17.0, 12.0, 11.0, 2.0, 4.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1326.891357421875, -1286.4144287109375, -1245.9375, -1205.4605712890625, -1164.983642578125, -1124.5067138671875, -1084.02978515625, -1043.552978515625, -1003.0759887695312, -962.5990600585938, -922.1221313476562, -881.6452026367188, -841.1683349609375, -800.69140625, -760.2144775390625, -719.737548828125, -679.2606201171875, -638.78369140625, -598.3067626953125, -557.829833984375, -517.3529052734375, -476.8760070800781, -436.39910888671875, -395.92218017578125, -355.44525146484375, -314.96832275390625, -274.49139404296875, -234.01449584960938, -193.53756713867188, -153.06063842773438, -112.58372497558594, -72.1068115234375, -31.6297607421875, 8.847160339355469, 49.32408142089844, 89.8010025024414, 130.27792358398438, 170.75485229492188, 211.2317657470703, 251.70867919921875, 292.18560791015625, 332.66253662109375, 373.13946533203125, 413.6163635253906, 454.0932922363281, 494.5702209472656, 535.047119140625, 575.5240478515625, 616.0009765625, 656.4779052734375, 696.954833984375, 737.4317626953125, 777.90869140625, 818.3856201171875, 858.8624877929688, 899.3394165039062, 939.8163452148438, 980.2932739257812, 1020.7702026367188, 1061.2470703125, 1101.7239990234375, 1142.200927734375, 1182.6778564453125, 1223.15478515625, 1263.6317138671875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 10.0, 5.0, 21.0, 21.0, 48.0, 74.0, 128.0, 268.0, 586.0, 1489.0, 4935.0, 30385.0, 4003480.0, 138036.0, 10293.0, 2597.0, 933.0, 435.0, 219.0, 114.0, 66.0, 43.0, 27.0, 22.0, 17.0, 5.0, 6.0, 5.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-223.375, -215.021484375, -206.66796875, -198.314453125, -189.9609375, -181.607421875, -173.25390625, -164.900390625, -156.546875, -148.193359375, -139.83984375, -131.486328125, -123.1328125, -114.779296875, -106.42578125, -98.072265625, -89.71875, -81.365234375, -73.01171875, -64.658203125, -56.3046875, -47.951171875, -39.59765625, -31.244140625, -22.890625, -14.537109375, -6.18359375, 2.169921875, 10.5234375, 18.876953125, 27.23046875, 35.583984375, 43.9375, 52.291015625, 60.64453125, 68.998046875, 77.3515625, 85.705078125, 94.05859375, 102.412109375, 110.765625, 119.119140625, 127.47265625, 135.826171875, 144.1796875, 152.533203125, 160.88671875, 169.240234375, 177.59375, 185.947265625, 194.30078125, 202.654296875, 211.0078125, 219.361328125, 227.71484375, 236.068359375, 244.421875, 252.775390625, 261.12890625, 269.482421875, 277.8359375, 286.189453125, 294.54296875, 302.896484375, 311.25]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 13.0, 24.0, 28.0, 44.0, 67.0, 83.0, 98.0, 134.0, 110.0, 93.0, 82.0, 74.0, 39.0, 42.0, 15.0, 14.0, 11.0, 4.0, 3.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.28125, -51.71142578125, -49.1416015625, -46.57177734375, -44.001953125, -41.43212890625, -38.8623046875, -36.29248046875, -33.72265625, -31.15283203125, -28.5830078125, -26.01318359375, -23.443359375, -20.87353515625, -18.3037109375, -15.73388671875, -13.1640625, -10.59423828125, -8.0244140625, -5.45458984375, -2.884765625, -0.31494140625, 2.2548828125, 4.82470703125, 7.39453125, 9.96435546875, 12.5341796875, 15.10400390625, 17.673828125, 20.24365234375, 22.8134765625, 25.38330078125, 27.953125, 30.52294921875, 33.0927734375, 35.66259765625, 38.232421875, 40.80224609375, 43.3720703125, 45.94189453125, 48.51171875, 51.08154296875, 53.6513671875, 56.22119140625, 58.791015625, 61.36083984375, 63.9306640625, 66.50048828125, 69.0703125, 71.64013671875, 74.2099609375, 76.77978515625, 79.349609375, 81.91943359375, 84.4892578125, 87.05908203125, 89.62890625, 92.19873046875, 94.7685546875, 97.33837890625, 99.908203125, 102.47802734375, 105.0478515625, 107.61767578125, 110.1875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 5.0, 12.0, 12.0, 19.0, 30.0, 51.0, 87.0, 138.0, 196.0, 446.0, 876.0, 2277.0, 8314.0, 52938.0, 3952632.0, 155657.0, 14679.0, 3521.0, 1208.0, 518.0, 256.0, 153.0, 75.0, 46.0, 42.0, 24.0, 23.0, 8.0, 10.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-262.25, -254.6875, -247.125, -239.5625, -232.0, -224.4375, -216.875, -209.3125, -201.75, -194.1875, -186.625, -179.0625, -171.5, -163.9375, -156.375, -148.8125, -141.25, -133.6875, -126.125, -118.5625, -111.0, -103.4375, -95.875, -88.3125, -80.75, -73.1875, -65.625, -58.0625, -50.5, -42.9375, -35.375, -27.8125, -20.25, -12.6875, -5.125, 2.4375, 10.0, 17.5625, 25.125, 32.6875, 40.25, 47.8125, 55.375, 62.9375, 70.5, 78.0625, 85.625, 93.1875, 100.75, 108.3125, 115.875, 123.4375, 131.0, 138.5625, 146.125, 153.6875, 161.25, 168.8125, 176.375, 183.9375, 191.5, 199.0625, 206.625, 214.1875, 221.75]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 6.0, 8.0, 13.0, 19.0, 41.0, 55.0, 174.0, 795.0, 2361.0, 380.0, 83.0, 49.0, 21.0, 22.0, 9.0, 7.0, 9.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-240.75, -232.79296875, -224.8359375, -216.87890625, -208.921875, -200.96484375, -193.0078125, -185.05078125, -177.09375, -169.13671875, -161.1796875, -153.22265625, -145.265625, -137.30859375, -129.3515625, -121.39453125, -113.4375, -105.48046875, -97.5234375, -89.56640625, -81.609375, -73.65234375, -65.6953125, -57.73828125, -49.78125, -41.82421875, -33.8671875, -25.91015625, -17.953125, -9.99609375, -2.0390625, 5.91796875, 13.875, 21.83203125, 29.7890625, 37.74609375, 45.703125, 53.66015625, 61.6171875, 69.57421875, 77.53125, 85.48828125, 93.4453125, 101.40234375, 109.359375, 117.31640625, 125.2734375, 133.23046875, 141.1875, 149.14453125, 157.1015625, 165.05859375, 173.015625, 180.97265625, 188.9296875, 196.88671875, 204.84375, 212.80078125, 220.7578125, 228.71484375, 236.671875, 244.62890625, 252.5859375, 260.54296875, 268.5]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 8.0, 11.0, 25.0, 63.0, 201.0, 312.0, 218.0, 100.0, 30.0, 23.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-570.9722290039062, -511.0196228027344, -451.0670166015625, -391.1143798828125, -331.16180419921875, -271.20916748046875, -211.25656127929688, -151.303955078125, -91.35134887695312, -31.398738861083984, 28.553871154785156, 88.50648498535156, 148.45909118652344, 208.41171264648438, 268.36431884765625, 328.3169250488281, 388.26953125, 448.2221374511719, 508.17474365234375, 568.1273803710938, 628.0799560546875, 688.0325927734375, 747.9852294921875, 807.9378051757812, 867.890380859375, 927.843017578125, 987.7955932617188, 1047.7481689453125, 1107.7008056640625, 1167.6534423828125, 1227.6060791015625, 1287.55859375, 1347.5113525390625, 1407.4639892578125, 1467.4166259765625, 1527.369140625, 1587.32177734375, 1647.2744140625, 1707.22705078125, 1767.1796875, 1827.1322021484375, 1887.0848388671875, 1947.0374755859375, 2006.989990234375, 2066.942626953125, 2126.895263671875, 2186.847900390625, 2246.800537109375, 2306.753173828125, 2366.705810546875, 2426.658447265625, 2486.611083984375, 2546.563720703125, 2606.51611328125, 2666.46875, 2726.42138671875, 2786.3740234375, 2846.32666015625, 2906.279296875, 2966.23193359375, 3026.1845703125, 3086.13720703125, 3146.089599609375, 3206.042236328125, 3265.994873046875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 2.0, 3.0, 11.0, 8.0, 11.0, 20.0, 13.0, 9.0, 16.0, 24.0, 25.0, 27.0, 40.0, 29.0, 42.0, 37.0, 46.0, 38.0, 46.0, 53.0, 58.0, 40.0, 53.0, 40.0, 50.0, 30.0, 43.0, 27.0, 30.0, 23.0, 20.0, 18.0, 19.0, 9.0, 11.0, 10.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-589.9921875, -572.6132202148438, -555.2342529296875, -537.855224609375, -520.4762573242188, -503.0972900390625, -485.71832275390625, -468.33935546875, -450.96038818359375, -433.5814208984375, -416.2024230957031, -398.8234558105469, -381.4444885253906, -364.06549072265625, -346.6865234375, -329.30755615234375, -311.9285583496094, -294.5495910644531, -277.17059326171875, -259.7916259765625, -242.41265869140625, -225.03367614746094, -207.65469360351562, -190.27572631835938, -172.89674377441406, -155.51776123046875, -138.1387939453125, -120.75981140136719, -103.3808364868164, -86.00186157226562, -68.62287902832031, -51.24390411376953, -33.86492919921875, -16.485952377319336, 0.8930244445800781, 18.272003173828125, 35.650978088378906, 53.02995300292969, 70.408935546875, 87.78791046142578, 105.16688537597656, 122.54586029052734, 139.92483520507812, 157.30381774902344, 174.68280029296875, 192.061767578125, 209.4407501220703, 226.81973266601562, 244.19869995117188, 261.5776672363281, 278.9566650390625, 296.33563232421875, 313.714599609375, 331.09356689453125, 348.4725646972656, 365.8515319824219, 383.23052978515625, 400.6094970703125, 417.9884948730469, 435.3674621582031, 452.7464294433594, 470.12542724609375, 487.50439453125, 504.88336181640625, 522.2623291015625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 9.0, 8.0, 18.0, 17.0, 31.0, 33.0, 50.0, 83.0, 101.0, 167.0, 274.0, 484.0, 903.0, 1588.0, 3461.0, 8388.0, 22537.0, 79815.0, 389043.0, 416635.0, 84960.0, 23916.0, 8580.0, 3540.0, 1687.0, 848.0, 487.0, 286.0, 193.0, 120.0, 78.0, 51.0, 33.0, 29.0, 23.0, 19.0, 8.0, 4.0, 10.0, 9.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-153.5, -148.98828125, -144.4765625, -139.96484375, -135.453125, -130.94140625, -126.4296875, -121.91796875, -117.40625, -112.89453125, -108.3828125, -103.87109375, -99.359375, -94.84765625, -90.3359375, -85.82421875, -81.3125, -76.80078125, -72.2890625, -67.77734375, -63.265625, -58.75390625, -54.2421875, -49.73046875, -45.21875, -40.70703125, -36.1953125, -31.68359375, -27.171875, -22.66015625, -18.1484375, -13.63671875, -9.125, -4.61328125, -0.1015625, 4.41015625, 8.921875, 13.43359375, 17.9453125, 22.45703125, 26.96875, 31.48046875, 35.9921875, 40.50390625, 45.015625, 49.52734375, 54.0390625, 58.55078125, 63.0625, 67.57421875, 72.0859375, 76.59765625, 81.109375, 85.62109375, 90.1328125, 94.64453125, 99.15625, 103.66796875, 108.1796875, 112.69140625, 117.203125, 121.71484375, 126.2265625, 130.73828125, 135.25]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 6.0, 2.0, 12.0, 12.0, 18.0, 31.0, 38.0, 65.0, 63.0, 84.0, 94.0, 85.0, 85.0, 87.0, 81.0, 50.0, 55.0, 45.0, 28.0, 20.0, 14.0, 6.0, 5.0, 8.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.125, -50.9052734375, -48.685546875, -46.4658203125, -44.24609375, -42.0263671875, -39.806640625, -37.5869140625, -35.3671875, -33.1474609375, -30.927734375, -28.7080078125, -26.48828125, -24.2685546875, -22.048828125, -19.8291015625, -17.609375, -15.3896484375, -13.169921875, -10.9501953125, -8.73046875, -6.5107421875, -4.291015625, -2.0712890625, 0.1484375, 2.3681640625, 4.587890625, 6.8076171875, 9.02734375, 11.2470703125, 13.466796875, 15.6865234375, 17.90625, 20.1259765625, 22.345703125, 24.5654296875, 26.78515625, 29.0048828125, 31.224609375, 33.4443359375, 35.6640625, 37.8837890625, 40.103515625, 42.3232421875, 44.54296875, 46.7626953125, 48.982421875, 51.2021484375, 53.421875, 55.6416015625, 57.861328125, 60.0810546875, 62.30078125, 64.5205078125, 66.740234375, 68.9599609375, 71.1796875, 73.3994140625, 75.619140625, 77.8388671875, 80.05859375, 82.2783203125, 84.498046875, 86.7177734375, 88.9375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 4.0, 10.0, 10.0, 16.0, 19.0, 14.0, 38.0, 50.0, 71.0, 116.0, 163.0, 262.0, 490.0, 839.0, 1861.0, 4792.0, 18595.0, 169314.0, 771914.0, 63207.0, 10456.0, 3168.0, 1391.0, 683.0, 371.0, 226.0, 145.0, 94.0, 69.0, 36.0, 29.0, 24.0, 15.0, 17.0, 7.0, 8.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-274.75, -266.24609375, -257.7421875, -249.23828125, -240.734375, -232.23046875, -223.7265625, -215.22265625, -206.71875, -198.21484375, -189.7109375, -181.20703125, -172.703125, -164.19921875, -155.6953125, -147.19140625, -138.6875, -130.18359375, -121.6796875, -113.17578125, -104.671875, -96.16796875, -87.6640625, -79.16015625, -70.65625, -62.15234375, -53.6484375, -45.14453125, -36.640625, -28.13671875, -19.6328125, -11.12890625, -2.625, 5.87890625, 14.3828125, 22.88671875, 31.390625, 39.89453125, 48.3984375, 56.90234375, 65.40625, 73.91015625, 82.4140625, 90.91796875, 99.421875, 107.92578125, 116.4296875, 124.93359375, 133.4375, 141.94140625, 150.4453125, 158.94921875, 167.453125, 175.95703125, 184.4609375, 192.96484375, 201.46875, 209.97265625, 218.4765625, 226.98046875, 235.484375, 243.98828125, 252.4921875, 260.99609375, 269.5]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 7.0, 12.0, 9.0, 12.0, 18.0, 28.0, 25.0, 35.0, 41.0, 57.0, 65.0, 64.0, 63.0, 71.0, 69.0, 72.0, 72.0, 52.0, 43.0, 44.0, 29.0, 23.0, 21.0, 12.0, 12.0, 11.0, 11.0, 4.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-264.25, -254.30078125, -244.3515625, -234.40234375, -224.453125, -214.50390625, -204.5546875, -194.60546875, -184.65625, -174.70703125, -164.7578125, -154.80859375, -144.859375, -134.91015625, -124.9609375, -115.01171875, -105.0625, -95.11328125, -85.1640625, -75.21484375, -65.265625, -55.31640625, -45.3671875, -35.41796875, -25.46875, -15.51953125, -5.5703125, 4.37890625, 14.328125, 24.27734375, 34.2265625, 44.17578125, 54.125, 64.07421875, 74.0234375, 83.97265625, 93.921875, 103.87109375, 113.8203125, 123.76953125, 133.71875, 143.66796875, 153.6171875, 163.56640625, 173.515625, 183.46484375, 193.4140625, 203.36328125, 213.3125, 223.26171875, 233.2109375, 243.16015625, 253.109375, 263.05859375, 273.0078125, 282.95703125, 292.90625, 302.85546875, 312.8046875, 322.75390625, 332.703125, 342.65234375, 352.6015625, 362.55078125, 372.5]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 6.0, 6.0, 9.0, 8.0, 19.0, 23.0, 41.0, 48.0, 78.0, 174.0, 327.0, 723.0, 2179.0, 13243.0, 897868.0, 125474.0, 5868.0, 1342.0, 505.0, 257.0, 136.0, 70.0, 36.0, 31.0, 19.0, 14.0, 12.0, 5.0, 2.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-280.25, -272.19921875, -264.1484375, -256.09765625, -248.046875, -239.99609375, -231.9453125, -223.89453125, -215.84375, -207.79296875, -199.7421875, -191.69140625, -183.640625, -175.58984375, -167.5390625, -159.48828125, -151.4375, -143.38671875, -135.3359375, -127.28515625, -119.234375, -111.18359375, -103.1328125, -95.08203125, -87.03125, -78.98046875, -70.9296875, -62.87890625, -54.828125, -46.77734375, -38.7265625, -30.67578125, -22.625, -14.57421875, -6.5234375, 1.52734375, 9.578125, 17.62890625, 25.6796875, 33.73046875, 41.78125, 49.83203125, 57.8828125, 65.93359375, 73.984375, 82.03515625, 90.0859375, 98.13671875, 106.1875, 114.23828125, 122.2890625, 130.33984375, 138.390625, 146.44140625, 154.4921875, 162.54296875, 170.59375, 178.64453125, 186.6953125, 194.74609375, 202.796875, 210.84765625, 218.8984375, 226.94921875, 235.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 7.0, 13.0, 20.0, 19.0, 50.0, 74.0, 85.0, 156.0, 200.0, 138.0, 101.0, 47.0, 24.0, 13.0, 11.0, 14.0, 6.0, 5.0, 6.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03118896484375, -0.03035116195678711, -0.02951335906982422, -0.028675556182861328, -0.027837753295898438, -0.026999950408935547, -0.026162147521972656, -0.025324344635009766, -0.024486541748046875, -0.023648738861083984, -0.022810935974121094, -0.021973133087158203, -0.021135330200195312, -0.020297527313232422, -0.01945972442626953, -0.01862192153930664, -0.01778411865234375, -0.01694631576538086, -0.01610851287841797, -0.015270709991455078, -0.014432907104492188, -0.013595104217529297, -0.012757301330566406, -0.011919498443603516, -0.011081695556640625, -0.010243892669677734, -0.009406089782714844, -0.008568286895751953, -0.0077304840087890625, -0.006892681121826172, -0.006054878234863281, -0.005217075347900391, -0.0043792724609375, -0.0035414695739746094, -0.0027036666870117188, -0.0018658638000488281, -0.0010280609130859375, -0.00019025802612304688, 0.0006475448608398438, 0.0014853477478027344, 0.002323150634765625, 0.0031609535217285156, 0.003998756408691406, 0.004836559295654297, 0.0056743621826171875, 0.006512165069580078, 0.007349967956542969, 0.00818777084350586, 0.00902557373046875, 0.00986337661743164, 0.010701179504394531, 0.011538982391357422, 0.012376785278320312, 0.013214588165283203, 0.014052391052246094, 0.014890193939208984, 0.015727996826171875, 0.016565799713134766, 0.017403602600097656, 0.018241405487060547, 0.019079208374023438, 0.019917011260986328, 0.02075481414794922, 0.02159261703491211, 0.022430419921875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 5.0, 7.0, 7.0, 10.0, 20.0, 11.0, 29.0, 37.0, 36.0, 77.0, 107.0, 146.0, 226.0, 350.0, 544.0, 893.0, 1968.0, 4501.0, 14618.0, 80342.0, 804202.0, 112886.0, 17431.0, 5249.0, 2062.0, 1112.0, 607.0, 342.0, 227.0, 144.0, 95.0, 70.0, 58.0, 33.0, 23.0, 12.0, 15.0, 16.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.5, -102.2607421875, -99.021484375, -95.7822265625, -92.54296875, -89.3037109375, -86.064453125, -82.8251953125, -79.5859375, -76.3466796875, -73.107421875, -69.8681640625, -66.62890625, -63.3896484375, -60.150390625, -56.9111328125, -53.671875, -50.4326171875, -47.193359375, -43.9541015625, -40.71484375, -37.4755859375, -34.236328125, -30.9970703125, -27.7578125, -24.5185546875, -21.279296875, -18.0400390625, -14.80078125, -11.5615234375, -8.322265625, -5.0830078125, -1.84375, 1.3955078125, 4.634765625, 7.8740234375, 11.11328125, 14.3525390625, 17.591796875, 20.8310546875, 24.0703125, 27.3095703125, 30.548828125, 33.7880859375, 37.02734375, 40.2666015625, 43.505859375, 46.7451171875, 49.984375, 53.2236328125, 56.462890625, 59.7021484375, 62.94140625, 66.1806640625, 69.419921875, 72.6591796875, 75.8984375, 79.1376953125, 82.376953125, 85.6162109375, 88.85546875, 92.0947265625, 95.333984375, 98.5732421875, 101.8125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 1.0, 4.0, 11.0, 12.0, 17.0, 9.0, 12.0, 21.0, 21.0, 37.0, 50.0, 79.0, 104.0, 116.0, 118.0, 96.0, 75.0, 60.0, 40.0, 21.0, 15.0, 16.0, 9.0, 9.0, 8.0, 6.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-121.75, -118.05859375, -114.3671875, -110.67578125, -106.984375, -103.29296875, -99.6015625, -95.91015625, -92.21875, -88.52734375, -84.8359375, -81.14453125, -77.453125, -73.76171875, -70.0703125, -66.37890625, -62.6875, -58.99609375, -55.3046875, -51.61328125, -47.921875, -44.23046875, -40.5390625, -36.84765625, -33.15625, -29.46484375, -25.7734375, -22.08203125, -18.390625, -14.69921875, -11.0078125, -7.31640625, -3.625, 0.06640625, 3.7578125, 7.44921875, 11.140625, 14.83203125, 18.5234375, 22.21484375, 25.90625, 29.59765625, 33.2890625, 36.98046875, 40.671875, 44.36328125, 48.0546875, 51.74609375, 55.4375, 59.12890625, 62.8203125, 66.51171875, 70.203125, 73.89453125, 77.5859375, 81.27734375, 84.96875, 88.66015625, 92.3515625, 96.04296875, 99.734375, 103.42578125, 107.1171875, 110.80859375, 114.5]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 11.0, 54.0, 138.0, 266.0, 273.0, 142.0, 56.0, 28.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2462.260986328125, -2370.650146484375, -2279.03955078125, -2187.4287109375, -2095.818115234375, -2004.2073974609375, -1912.5966796875, -1820.98583984375, -1729.375244140625, -1637.7645263671875, -1546.15380859375, -1454.5430908203125, -1362.932373046875, -1271.3216552734375, -1179.7109375, -1088.10009765625, -996.4893798828125, -904.878662109375, -813.2679443359375, -721.6572265625, -630.0465087890625, -538.435791015625, -446.82501220703125, -355.21429443359375, -263.60357666015625, -171.99285888671875, -80.38212585449219, 11.228607177734375, 102.83932495117188, 194.45004272460938, 286.060791015625, 377.6715087890625, 469.2822265625, 560.8929443359375, 652.503662109375, 744.1143798828125, 835.72509765625, 927.3358154296875, 1018.9465942382812, 1110.557373046875, 1202.16796875, 1293.7786865234375, 1385.389404296875, 1477.0001220703125, 1568.61083984375, 1660.2215576171875, 1751.832275390625, 1843.443115234375, 1935.0538330078125, 2026.66455078125, 2118.275390625, 2209.885986328125, 2301.496826171875, 2393.107421875, 2484.71826171875, 2576.328857421875, 2667.939697265625, 2759.550537109375, 2851.1611328125, 2942.77197265625, 3034.382568359375, 3125.993408203125, 3217.60400390625, 3309.21484375, 3400.825439453125]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 9.0, 9.0, 19.0, 17.0, 27.0, 27.0, 48.0, 38.0, 45.0, 40.0, 56.0, 57.0, 76.0, 75.0, 65.0, 77.0, 43.0, 47.0, 42.0, 28.0, 33.0, 30.0, 17.0, 7.0, 18.0, 13.0, 4.0, 8.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1112.8363037109375, -1075.85400390625, -1038.8717041015625, -1001.8893432617188, -964.9070434570312, -927.9247436523438, -890.9423828125, -853.9600830078125, -816.977783203125, -779.9954833984375, -743.01318359375, -706.0308227539062, -669.0485229492188, -632.0662231445312, -595.0838623046875, -558.1015625, -521.1192626953125, -484.136962890625, -447.1546325683594, -410.17230224609375, -373.19000244140625, -336.20770263671875, -299.2253723144531, -262.2430419921875, -225.2607421875, -188.27842712402344, -151.29611206054688, -114.31379699707031, -77.33148193359375, -40.34916687011719, -3.366851806640625, 33.615478515625, 70.597900390625, 107.58021545410156, 144.56253051757812, 181.5448455810547, 218.52716064453125, 255.5094757080078, 292.4917907714844, 329.47412109375, 366.4564208984375, 403.438720703125, 440.4210510253906, 477.40338134765625, 514.3856811523438, 551.3679809570312, 588.350341796875, 625.3326416015625, 662.31494140625, 699.2972412109375, 736.279541015625, 773.2619018554688, 810.2442016601562, 847.2265014648438, 884.2088623046875, 921.191162109375, 958.1734619140625, 995.15576171875, 1032.1380615234375, 1069.120361328125, 1106.102783203125, 1143.0850830078125, 1180.0673828125, 1217.0496826171875, 1254.031982421875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 7.0, 18.0, 12.0, 19.0, 34.0, 62.0, 78.0, 136.0, 246.0, 471.0, 989.0, 2300.0, 6534.0, 23289.0, 224631.0, 3845440.0, 68847.0, 12762.0, 4335.0, 1764.0, 866.0, 490.0, 296.0, 203.0, 117.0, 80.0, 54.0, 37.0, 29.0, 19.0, 17.0, 21.0, 9.0, 12.0, 12.0, 6.0, 3.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-157.125, -152.265625, -147.40625, -142.546875, -137.6875, -132.828125, -127.96875, -123.109375, -118.25, -113.390625, -108.53125, -103.671875, -98.8125, -93.953125, -89.09375, -84.234375, -79.375, -74.515625, -69.65625, -64.796875, -59.9375, -55.078125, -50.21875, -45.359375, -40.5, -35.640625, -30.78125, -25.921875, -21.0625, -16.203125, -11.34375, -6.484375, -1.625, 3.234375, 8.09375, 12.953125, 17.8125, 22.671875, 27.53125, 32.390625, 37.25, 42.109375, 46.96875, 51.828125, 56.6875, 61.546875, 66.40625, 71.265625, 76.125, 80.984375, 85.84375, 90.703125, 95.5625, 100.421875, 105.28125, 110.140625, 115.0, 119.859375, 124.71875, 129.578125, 134.4375, 139.296875, 144.15625, 149.015625, 153.875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 8.0, 19.0, 24.0, 55.0, 85.0, 116.0, 147.0, 145.0, 110.0, 92.0, 85.0, 44.0, 31.0, 15.0, 9.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-65.0, -61.68359375, -58.3671875, -55.05078125, -51.734375, -48.41796875, -45.1015625, -41.78515625, -38.46875, -35.15234375, -31.8359375, -28.51953125, -25.203125, -21.88671875, -18.5703125, -15.25390625, -11.9375, -8.62109375, -5.3046875, -1.98828125, 1.328125, 4.64453125, 7.9609375, 11.27734375, 14.59375, 17.91015625, 21.2265625, 24.54296875, 27.859375, 31.17578125, 34.4921875, 37.80859375, 41.125, 44.44140625, 47.7578125, 51.07421875, 54.390625, 57.70703125, 61.0234375, 64.33984375, 67.65625, 70.97265625, 74.2890625, 77.60546875, 80.921875, 84.23828125, 87.5546875, 90.87109375, 94.1875, 97.50390625, 100.8203125, 104.13671875, 107.453125, 110.76953125, 114.0859375, 117.40234375, 120.71875, 124.03515625, 127.3515625, 130.66796875, 133.984375, 137.30078125, 140.6171875, 143.93359375, 147.25]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 11.0, 4.0, 25.0, 22.0, 38.0, 47.0, 84.0, 105.0, 171.0, 264.0, 511.0, 945.0, 1764.0, 3775.0, 9020.0, 28743.0, 233701.0, 3760175.0, 120164.0, 20672.0, 7061.0, 3148.0, 1538.0, 822.0, 462.0, 276.0, 197.0, 146.0, 103.0, 76.0, 65.0, 41.0, 32.0, 31.0, 10.0, 11.0, 8.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-134.375, -129.08203125, -123.7890625, -118.49609375, -113.203125, -107.91015625, -102.6171875, -97.32421875, -92.03125, -86.73828125, -81.4453125, -76.15234375, -70.859375, -65.56640625, -60.2734375, -54.98046875, -49.6875, -44.39453125, -39.1015625, -33.80859375, -28.515625, -23.22265625, -17.9296875, -12.63671875, -7.34375, -2.05078125, 3.2421875, 8.53515625, 13.828125, 19.12109375, 24.4140625, 29.70703125, 35.0, 40.29296875, 45.5859375, 50.87890625, 56.171875, 61.46484375, 66.7578125, 72.05078125, 77.34375, 82.63671875, 87.9296875, 93.22265625, 98.515625, 103.80859375, 109.1015625, 114.39453125, 119.6875, 124.98046875, 130.2734375, 135.56640625, 140.859375, 146.15234375, 151.4453125, 156.73828125, 162.03125, 167.32421875, 172.6171875, 177.91015625, 183.203125, 188.49609375, 193.7890625, 199.08203125, 204.375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 6.0, 5.0, 10.0, 21.0, 24.0, 36.0, 48.0, 96.0, 232.0, 715.0, 1696.0, 685.0, 226.0, 91.0, 54.0, 40.0, 13.0, 15.0, 9.0, 6.0, 5.0, 3.0, 7.0, 2.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-137.0, -131.62109375, -126.2421875, -120.86328125, -115.484375, -110.10546875, -104.7265625, -99.34765625, -93.96875, -88.58984375, -83.2109375, -77.83203125, -72.453125, -67.07421875, -61.6953125, -56.31640625, -50.9375, -45.55859375, -40.1796875, -34.80078125, -29.421875, -24.04296875, -18.6640625, -13.28515625, -7.90625, -2.52734375, 2.8515625, 8.23046875, 13.609375, 18.98828125, 24.3671875, 29.74609375, 35.125, 40.50390625, 45.8828125, 51.26171875, 56.640625, 62.01953125, 67.3984375, 72.77734375, 78.15625, 83.53515625, 88.9140625, 94.29296875, 99.671875, 105.05078125, 110.4296875, 115.80859375, 121.1875, 126.56640625, 131.9453125, 137.32421875, 142.703125, 148.08203125, 153.4609375, 158.83984375, 164.21875, 169.59765625, 174.9765625, 180.35546875, 185.734375, 191.11328125, 196.4921875, 201.87109375, 207.25]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 11.0, 24.0, 87.0, 269.0, 352.0, 143.0, 58.0, 23.0, 13.0, 3.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1440.9588623046875, -1365.5877685546875, -1290.216796875, -1214.845703125, -1139.474609375, -1064.103515625, -988.7325439453125, -913.3614501953125, -837.9904174804688, -762.619384765625, -687.248291015625, -611.8772583007812, -536.5062255859375, -461.1351318359375, -385.76409912109375, -310.39300537109375, -235.02197265625, -159.65090942382812, -84.27986145019531, -8.9088134765625, 66.46224975585938, 141.83331298828125, 217.204345703125, 292.575439453125, 367.94647216796875, 443.3175354003906, 518.6885986328125, 594.0596313476562, 669.4306640625, 744.8017578125, 820.1727905273438, 895.5438842773438, 970.914794921875, 1046.285888671875, 1121.6568603515625, 1197.0279541015625, 1272.3990478515625, 1347.77001953125, 1423.14111328125, 1498.51220703125, 1573.88330078125, 1649.25439453125, 1724.6253662109375, 1799.9964599609375, 1875.3675537109375, 1950.738525390625, 2026.109619140625, 2101.480712890625, 2176.8515625, 2252.22265625, 2327.59375, 2402.96484375, 2478.335693359375, 2553.706787109375, 2629.077880859375, 2704.448974609375, 2779.820068359375, 2855.191162109375, 2930.562255859375, 3005.93310546875, 3081.30419921875, 3156.67529296875, 3232.04638671875, 3307.41748046875, 3382.78857421875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 2.0, 5.0, 6.0, 9.0, 15.0, 8.0, 19.0, 17.0, 25.0, 27.0, 32.0, 39.0, 42.0, 42.0, 49.0, 63.0, 50.0, 53.0, 48.0, 50.0, 64.0, 43.0, 46.0, 41.0, 29.0, 41.0, 28.0, 25.0, 20.0, 16.0, 8.0, 11.0, 6.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-895.2177734375, -871.6389770507812, -848.0601806640625, -824.4813842773438, -800.902587890625, -777.3237915039062, -753.7449951171875, -730.166259765625, -706.58740234375, -683.0086059570312, -659.4298095703125, -635.8510131835938, -612.272216796875, -588.6934204101562, -565.1146240234375, -541.535888671875, -517.9570922851562, -494.3782958984375, -470.79949951171875, -447.220703125, -423.64190673828125, -400.0631103515625, -376.4843444824219, -352.9055480957031, -329.3267517089844, -305.7479553222656, -282.1691589355469, -258.59039306640625, -235.01158142089844, -211.4327850341797, -187.85400390625, -164.27520751953125, -140.69647216796875, -117.11767578125, -93.53888702392578, -69.96009826660156, -46.38130187988281, -22.802505493164062, 0.776275634765625, 24.355072021484375, 47.933868408203125, 71.51266479492188, 95.0914535522461, 118.67024230957031, 142.24903869628906, 165.8278350830078, 189.4066162109375, 212.98541259765625, 236.564208984375, 260.14300537109375, 283.7218017578125, 307.30059814453125, 330.87939453125, 354.45819091796875, 378.0369567871094, 401.6157531738281, 425.1945495605469, 448.7733459472656, 472.3521423339844, 495.930908203125, 519.5097045898438, 543.0885009765625, 566.6672973632812, 590.24609375, 613.8248901367188]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 7.0, 16.0, 18.0, 20.0, 32.0, 51.0, 95.0, 143.0, 279.0, 514.0, 1078.0, 2466.0, 6646.0, 21279.0, 86728.0, 524495.0, 324468.0, 56302.0, 15037.0, 4973.0, 1944.0, 897.0, 469.0, 249.0, 132.0, 77.0, 40.0, 31.0, 21.0, 14.0, 10.0, 7.0, 5.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.125, -180.09375, -174.0625, -168.03125, -162.0, -155.96875, -149.9375, -143.90625, -137.875, -131.84375, -125.8125, -119.78125, -113.75, -107.71875, -101.6875, -95.65625, -89.625, -83.59375, -77.5625, -71.53125, -65.5, -59.46875, -53.4375, -47.40625, -41.375, -35.34375, -29.3125, -23.28125, -17.25, -11.21875, -5.1875, 0.84375, 6.875, 12.90625, 18.9375, 24.96875, 31.0, 37.03125, 43.0625, 49.09375, 55.125, 61.15625, 67.1875, 73.21875, 79.25, 85.28125, 91.3125, 97.34375, 103.375, 109.40625, 115.4375, 121.46875, 127.5, 133.53125, 139.5625, 145.59375, 151.625, 157.65625, 163.6875, 169.71875, 175.75, 181.78125, 187.8125, 193.84375, 199.875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 11.0, 13.0, 23.0, 19.0, 34.0, 42.0, 58.0, 73.0, 78.0, 89.0, 101.0, 84.0, 78.0, 75.0, 51.0, 47.0, 41.0, 23.0, 15.0, 17.0, 14.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5, -63.802734375, -61.10546875, -58.408203125, -55.7109375, -53.013671875, -50.31640625, -47.619140625, -44.921875, -42.224609375, -39.52734375, -36.830078125, -34.1328125, -31.435546875, -28.73828125, -26.041015625, -23.34375, -20.646484375, -17.94921875, -15.251953125, -12.5546875, -9.857421875, -7.16015625, -4.462890625, -1.765625, 0.931640625, 3.62890625, 6.326171875, 9.0234375, 11.720703125, 14.41796875, 17.115234375, 19.8125, 22.509765625, 25.20703125, 27.904296875, 30.6015625, 33.298828125, 35.99609375, 38.693359375, 41.390625, 44.087890625, 46.78515625, 49.482421875, 52.1796875, 54.876953125, 57.57421875, 60.271484375, 62.96875, 65.666015625, 68.36328125, 71.060546875, 73.7578125, 76.455078125, 79.15234375, 81.849609375, 84.546875, 87.244140625, 89.94140625, 92.638671875, 95.3359375, 98.033203125, 100.73046875, 103.427734375, 106.125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 0.0, 5.0, 2.0, 4.0, 7.0, 12.0, 8.0, 14.0, 24.0, 19.0, 37.0, 55.0, 86.0, 103.0, 170.0, 258.0, 453.0, 760.0, 1460.0, 3132.0, 8263.0, 31001.0, 199898.0, 686888.0, 88083.0, 17353.0, 5485.0, 2203.0, 1082.0, 601.0, 371.0, 231.0, 149.0, 99.0, 80.0, 51.0, 31.0, 22.0, 9.0, 12.0, 10.0, 11.0, 3.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-261.25, -253.849609375, -246.44921875, -239.048828125, -231.6484375, -224.248046875, -216.84765625, -209.447265625, -202.046875, -194.646484375, -187.24609375, -179.845703125, -172.4453125, -165.044921875, -157.64453125, -150.244140625, -142.84375, -135.443359375, -128.04296875, -120.642578125, -113.2421875, -105.841796875, -98.44140625, -91.041015625, -83.640625, -76.240234375, -68.83984375, -61.439453125, -54.0390625, -46.638671875, -39.23828125, -31.837890625, -24.4375, -17.037109375, -9.63671875, -2.236328125, 5.1640625, 12.564453125, 19.96484375, 27.365234375, 34.765625, 42.166015625, 49.56640625, 56.966796875, 64.3671875, 71.767578125, 79.16796875, 86.568359375, 93.96875, 101.369140625, 108.76953125, 116.169921875, 123.5703125, 130.970703125, 138.37109375, 145.771484375, 153.171875, 160.572265625, 167.97265625, 175.373046875, 182.7734375, 190.173828125, 197.57421875, 204.974609375, 212.375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 9.0, 6.0, 10.0, 12.0, 27.0, 30.0, 30.0, 33.0, 49.0, 39.0, 57.0, 79.0, 73.0, 78.0, 51.0, 59.0, 57.0, 43.0, 51.0, 40.0, 29.0, 32.0, 18.0, 23.0, 9.0, 11.0, 10.0, 11.0, 2.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-355.5, -346.341796875, -337.18359375, -328.025390625, -318.8671875, -309.708984375, -300.55078125, -291.392578125, -282.234375, -273.076171875, -263.91796875, -254.759765625, -245.6015625, -236.443359375, -227.28515625, -218.126953125, -208.96875, -199.810546875, -190.65234375, -181.494140625, -172.3359375, -163.177734375, -154.01953125, -144.861328125, -135.703125, -126.544921875, -117.38671875, -108.228515625, -99.0703125, -89.912109375, -80.75390625, -71.595703125, -62.4375, -53.279296875, -44.12109375, -34.962890625, -25.8046875, -16.646484375, -7.48828125, 1.669921875, 10.828125, 19.986328125, 29.14453125, 38.302734375, 47.4609375, 56.619140625, 65.77734375, 74.935546875, 84.09375, 93.251953125, 102.41015625, 111.568359375, 120.7265625, 129.884765625, 139.04296875, 148.201171875, 157.359375, 166.517578125, 175.67578125, 184.833984375, 193.9921875, 203.150390625, 212.30859375, 221.466796875, 230.625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 12.0, 39.0, 76.0, 255.0, 1266.0, 16245.0, 997005.0, 31395.0, 1753.0, 343.0, 89.0, 36.0, 11.0, 6.0, 6.0, 6.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.125, -198.908203125, -189.69140625, -180.474609375, -171.2578125, -162.041015625, -152.82421875, -143.607421875, -134.390625, -125.173828125, -115.95703125, -106.740234375, -97.5234375, -88.306640625, -79.08984375, -69.873046875, -60.65625, -51.439453125, -42.22265625, -33.005859375, -23.7890625, -14.572265625, -5.35546875, 3.861328125, 13.078125, 22.294921875, 31.51171875, 40.728515625, 49.9453125, 59.162109375, 68.37890625, 77.595703125, 86.8125, 96.029296875, 105.24609375, 114.462890625, 123.6796875, 132.896484375, 142.11328125, 151.330078125, 160.546875, 169.763671875, 178.98046875, 188.197265625, 197.4140625, 206.630859375, 215.84765625, 225.064453125, 234.28125, 243.498046875, 252.71484375, 261.931640625, 271.1484375, 280.365234375, 289.58203125, 298.798828125, 308.015625, 317.232421875, 326.44921875, 335.666015625, 344.8828125, 354.099609375, 363.31640625, 372.533203125, 381.75]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 12.0, 12.0, 15.0, 24.0, 40.0, 62.0, 115.0, 179.0, 213.0, 102.0, 71.0, 62.0, 34.0, 19.0, 13.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024078369140625, -0.0232236385345459, -0.022368907928466797, -0.021514177322387695, -0.020659446716308594, -0.019804716110229492, -0.01894998550415039, -0.01809525489807129, -0.017240524291992188, -0.016385793685913086, -0.015531063079833984, -0.014676332473754883, -0.013821601867675781, -0.01296687126159668, -0.012112140655517578, -0.011257410049438477, -0.010402679443359375, -0.009547948837280273, -0.008693218231201172, -0.00783848762512207, -0.006983757019042969, -0.006129026412963867, -0.005274295806884766, -0.004419565200805664, -0.0035648345947265625, -0.002710103988647461, -0.0018553733825683594, -0.0010006427764892578, -0.00014591217041015625, 0.0007088184356689453, 0.0015635490417480469, 0.0024182796478271484, 0.00327301025390625, 0.0041277408599853516, 0.004982471466064453, 0.005837202072143555, 0.006691932678222656, 0.007546663284301758, 0.00840139389038086, 0.009256124496459961, 0.010110855102539062, 0.010965585708618164, 0.011820316314697266, 0.012675046920776367, 0.013529777526855469, 0.01438450813293457, 0.015239238739013672, 0.016093969345092773, 0.016948699951171875, 0.017803430557250977, 0.018658161163330078, 0.01951289176940918, 0.02036762237548828, 0.021222352981567383, 0.022077083587646484, 0.022931814193725586, 0.023786544799804688, 0.02464127540588379, 0.02549600601196289, 0.026350736618041992, 0.027205467224121094, 0.028060197830200195, 0.028914928436279297, 0.0297696590423584, 0.0306243896484375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 1.0, 4.0, 12.0, 25.0, 41.0, 65.0, 192.0, 483.0, 1803.0, 14574.0, 931053.0, 94637.0, 4236.0, 908.0, 280.0, 122.0, 52.0, 28.0, 18.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-266.25, -259.1953125, -252.140625, -245.0859375, -238.03125, -230.9765625, -223.921875, -216.8671875, -209.8125, -202.7578125, -195.703125, -188.6484375, -181.59375, -174.5390625, -167.484375, -160.4296875, -153.375, -146.3203125, -139.265625, -132.2109375, -125.15625, -118.1015625, -111.046875, -103.9921875, -96.9375, -89.8828125, -82.828125, -75.7734375, -68.71875, -61.6640625, -54.609375, -47.5546875, -40.5, -33.4453125, -26.390625, -19.3359375, -12.28125, -5.2265625, 1.828125, 8.8828125, 15.9375, 22.9921875, 30.046875, 37.1015625, 44.15625, 51.2109375, 58.265625, 65.3203125, 72.375, 79.4296875, 86.484375, 93.5390625, 100.59375, 107.6484375, 114.703125, 121.7578125, 128.8125, 135.8671875, 142.921875, 149.9765625, 157.03125, 164.0859375, 171.140625, 178.1953125, 185.25]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 6.0, 15.0, 27.0, 50.0, 77.0, 89.0, 134.0, 181.0, 134.0, 81.0, 54.0, 38.0, 31.0, 19.0, 18.0, 6.0, 11.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.625, -120.900390625, -117.17578125, -113.451171875, -109.7265625, -106.001953125, -102.27734375, -98.552734375, -94.828125, -91.103515625, -87.37890625, -83.654296875, -79.9296875, -76.205078125, -72.48046875, -68.755859375, -65.03125, -61.306640625, -57.58203125, -53.857421875, -50.1328125, -46.408203125, -42.68359375, -38.958984375, -35.234375, -31.509765625, -27.78515625, -24.060546875, -20.3359375, -16.611328125, -12.88671875, -9.162109375, -5.4375, -1.712890625, 2.01171875, 5.736328125, 9.4609375, 13.185546875, 16.91015625, 20.634765625, 24.359375, 28.083984375, 31.80859375, 35.533203125, 39.2578125, 42.982421875, 46.70703125, 50.431640625, 54.15625, 57.880859375, 61.60546875, 65.330078125, 69.0546875, 72.779296875, 76.50390625, 80.228515625, 83.953125, 87.677734375, 91.40234375, 95.126953125, 98.8515625, 102.576171875, 106.30078125, 110.025390625, 113.75]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 10.0, 16.0, 31.0, 87.0, 187.0, 278.0, 199.0, 109.0, 49.0, 21.0, 2.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2960.446044921875, -2883.841552734375, -2807.23681640625, -2730.63232421875, -2654.027587890625, -2577.423095703125, -2500.818359375, -2424.2138671875, -2347.609375, -2271.0048828125, -2194.400146484375, -2117.795654296875, -2041.19091796875, -1964.58642578125, -1887.9818115234375, -1811.377197265625, -1734.7724609375, -1658.1678466796875, -1581.563232421875, -1504.9586181640625, -1428.35400390625, -1351.74951171875, -1275.1448974609375, -1198.540283203125, -1121.9356689453125, -1045.3310546875, -968.7264404296875, -892.1218872070312, -815.5172729492188, -738.9126586914062, -662.30810546875, -585.7034912109375, -509.098876953125, -432.4942626953125, -355.8896789550781, -279.28509521484375, -202.68048095703125, -126.07586669921875, -49.471282958984375, 27.13330078125, 103.7379150390625, 180.34251403808594, 256.9471130371094, 333.55169677734375, 410.15631103515625, 486.76092529296875, 563.365478515625, 639.9700927734375, 716.57470703125, 793.1793212890625, 869.783935546875, 946.3884887695312, 1022.9931030273438, 1099.59765625, 1176.2022705078125, 1252.806884765625, 1329.4114990234375, 1406.01611328125, 1482.6207275390625, 1559.225341796875, 1635.829833984375, 1712.4345703125, 1789.0390625, 1865.6436767578125, 1942.248291015625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 8.0, 5.0, 8.0, 15.0, 11.0, 18.0, 22.0, 19.0, 24.0, 26.0, 44.0, 46.0, 41.0, 41.0, 60.0, 56.0, 60.0, 56.0, 59.0, 41.0, 46.0, 38.0, 37.0, 33.0, 32.0, 26.0, 19.0, 16.0, 20.0, 14.0, 14.0, 7.0, 12.0, 7.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1078.828369140625, -1048.6292724609375, -1018.4302368164062, -988.231201171875, -958.0321044921875, -927.8330688476562, -897.634033203125, -867.4349365234375, -837.23583984375, -807.0368041992188, -776.8377075195312, -746.638671875, -716.4395751953125, -686.2405395507812, -656.04150390625, -625.8424072265625, -595.6433715820312, -565.4443359375, -535.2452392578125, -505.04620361328125, -474.84710693359375, -444.6480712890625, -414.4490051269531, -384.24993896484375, -354.0508728027344, -323.851806640625, -293.6527404785156, -263.45367431640625, -233.25462341308594, -203.05555725097656, -172.85650634765625, -142.65744018554688, -112.45843505859375, -82.25936889648438, -52.06031036376953, -21.861251831054688, 8.337814331054688, 38.53688049316406, 68.73593139648438, 98.93499755859375, 129.13406372070312, 159.3331298828125, 189.53219604492188, 219.7312469482422, 249.93031311035156, 280.12939453125, 310.32843017578125, 340.5274963378906, 370.7265625, 400.9256286621094, 431.12469482421875, 461.32373046875, 491.5228271484375, 521.7218627929688, 551.9208984375, 582.1199951171875, 612.319091796875, 642.5181274414062, 672.7172241210938, 702.916259765625, 733.1153564453125, 763.3143920898438, 793.513427734375, 823.7125244140625, 853.9115600585938]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 2.0, 5.0, 8.0, 10.0, 19.0, 18.0, 28.0, 44.0, 83.0, 148.0, 239.0, 454.0, 977.0, 2355.0, 6384.0, 21368.0, 122959.0, 3067494.0, 894796.0, 56314.0, 13282.0, 4299.0, 1537.0, 682.0, 353.0, 162.0, 99.0, 57.0, 38.0, 25.0, 14.0, 9.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-136.875, -132.826171875, -128.77734375, -124.728515625, -120.6796875, -116.630859375, -112.58203125, -108.533203125, -104.484375, -100.435546875, -96.38671875, -92.337890625, -88.2890625, -84.240234375, -80.19140625, -76.142578125, -72.09375, -68.044921875, -63.99609375, -59.947265625, -55.8984375, -51.849609375, -47.80078125, -43.751953125, -39.703125, -35.654296875, -31.60546875, -27.556640625, -23.5078125, -19.458984375, -15.41015625, -11.361328125, -7.3125, -3.263671875, 0.78515625, 4.833984375, 8.8828125, 12.931640625, 16.98046875, 21.029296875, 25.078125, 29.126953125, 33.17578125, 37.224609375, 41.2734375, 45.322265625, 49.37109375, 53.419921875, 57.46875, 61.517578125, 65.56640625, 69.615234375, 73.6640625, 77.712890625, 81.76171875, 85.810546875, 89.859375, 93.908203125, 97.95703125, 102.005859375, 106.0546875, 110.103515625, 114.15234375, 118.201171875, 122.25]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 12.0, 16.0, 20.0, 29.0, 32.0, 52.0, 65.0, 77.0, 87.0, 102.0, 94.0, 95.0, 65.0, 64.0, 49.0, 40.0, 35.0, 22.0, 15.0, 10.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.625, -96.939453125, -94.25390625, -91.568359375, -88.8828125, -86.197265625, -83.51171875, -80.826171875, -78.140625, -75.455078125, -72.76953125, -70.083984375, -67.3984375, -64.712890625, -62.02734375, -59.341796875, -56.65625, -53.970703125, -51.28515625, -48.599609375, -45.9140625, -43.228515625, -40.54296875, -37.857421875, -35.171875, -32.486328125, -29.80078125, -27.115234375, -24.4296875, -21.744140625, -19.05859375, -16.373046875, -13.6875, -11.001953125, -8.31640625, -5.630859375, -2.9453125, -0.259765625, 2.42578125, 5.111328125, 7.796875, 10.482421875, 13.16796875, 15.853515625, 18.5390625, 21.224609375, 23.91015625, 26.595703125, 29.28125, 31.966796875, 34.65234375, 37.337890625, 40.0234375, 42.708984375, 45.39453125, 48.080078125, 50.765625, 53.451171875, 56.13671875, 58.822265625, 61.5078125, 64.193359375, 66.87890625, 69.564453125, 72.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 15.0, 15.0, 20.0, 40.0, 80.0, 132.0, 279.0, 564.0, 1447.0, 4270.0, 16446.0, 98302.0, 3473502.0, 546206.0, 40005.0, 8208.0, 2579.0, 1070.0, 478.0, 238.0, 169.0, 81.0, 35.0, 35.0, 18.0, 7.0, 13.0, 9.0, 10.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-210.875, -203.794921875, -196.71484375, -189.634765625, -182.5546875, -175.474609375, -168.39453125, -161.314453125, -154.234375, -147.154296875, -140.07421875, -132.994140625, -125.9140625, -118.833984375, -111.75390625, -104.673828125, -97.59375, -90.513671875, -83.43359375, -76.353515625, -69.2734375, -62.193359375, -55.11328125, -48.033203125, -40.953125, -33.873046875, -26.79296875, -19.712890625, -12.6328125, -5.552734375, 1.52734375, 8.607421875, 15.6875, 22.767578125, 29.84765625, 36.927734375, 44.0078125, 51.087890625, 58.16796875, 65.248046875, 72.328125, 79.408203125, 86.48828125, 93.568359375, 100.6484375, 107.728515625, 114.80859375, 121.888671875, 128.96875, 136.048828125, 143.12890625, 150.208984375, 157.2890625, 164.369140625, 171.44921875, 178.529296875, 185.609375, 192.689453125, 199.76953125, 206.849609375, 213.9296875, 221.009765625, 228.08984375, 235.169921875, 242.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 6.0, 8.0, 15.0, 21.0, 26.0, 19.0, 28.0, 25.0, 59.0, 55.0, 104.0, 180.0, 293.0, 649.0, 1033.0, 692.0, 304.0, 177.0, 97.0, 68.0, 45.0, 44.0, 25.0, 27.0, 8.0, 13.0, 11.0, 4.0, 4.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.375, -139.875, -134.375, -128.875, -123.375, -117.875, -112.375, -106.875, -101.375, -95.875, -90.375, -84.875, -79.375, -73.875, -68.375, -62.875, -57.375, -51.875, -46.375, -40.875, -35.375, -29.875, -24.375, -18.875, -13.375, -7.875, -2.375, 3.125, 8.625, 14.125, 19.625, 25.125, 30.625, 36.125, 41.625, 47.125, 52.625, 58.125, 63.625, 69.125, 74.625, 80.125, 85.625, 91.125, 96.625, 102.125, 107.625, 113.125, 118.625, 124.125, 129.625, 135.125, 140.625, 146.125, 151.625, 157.125, 162.625, 168.125, 173.625, 179.125, 184.625, 190.125, 195.625, 201.125, 206.625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 11.0, 14.0, 25.0, 60.0, 120.0, 204.0, 237.0, 169.0, 84.0, 39.0, 9.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1396.2216796875, -1333.9627685546875, -1271.703857421875, -1209.4449462890625, -1147.18603515625, -1084.927001953125, -1022.6680908203125, -960.4091796875, -898.1502685546875, -835.891357421875, -773.6324462890625, -711.3734741210938, -649.1145629882812, -586.8556518554688, -524.5966796875, -462.3377685546875, -400.078857421875, -337.8199462890625, -275.5610046386719, -213.3020782470703, -151.04315185546875, -88.78424072265625, -26.525299072265625, 35.733642578125, 97.9925537109375, 160.25148010253906, 222.51040649414062, 284.76934814453125, 347.02825927734375, 409.28717041015625, 471.5461120605469, 533.8050537109375, 596.06396484375, 658.3228759765625, 720.581787109375, 782.8407592773438, 845.0996704101562, 907.3585815429688, 969.6175537109375, 1031.87646484375, 1094.1353759765625, 1156.394287109375, 1218.6531982421875, 1280.912109375, 1343.171142578125, 1405.429931640625, 1467.68896484375, 1529.9478759765625, 1592.206787109375, 1654.4656982421875, 1716.724609375, 1778.9835205078125, 1841.242431640625, 1903.50146484375, 1965.7603759765625, 2028.019287109375, 2090.2783203125, 2152.537353515625, 2214.796142578125, 2277.05517578125, 2339.31396484375, 2401.572998046875, 2463.831787109375, 2526.0908203125, 2588.349609375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 10.0, 3.0, 6.0, 8.0, 5.0, 10.0, 16.0, 16.0, 17.0, 13.0, 26.0, 22.0, 31.0, 31.0, 26.0, 30.0, 46.0, 45.0, 49.0, 44.0, 41.0, 56.0, 61.0, 40.0, 41.0, 39.0, 30.0, 28.0, 24.0, 22.0, 21.0, 29.0, 27.0, 19.0, 11.0, 12.0, 14.0, 4.0, 8.0, 6.0, 4.0, 6.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-768.3534545898438, -744.3721313476562, -720.3908081054688, -696.4094848632812, -672.4281005859375, -648.44677734375, -624.4654541015625, -600.484130859375, -576.5028076171875, -552.521484375, -528.5401611328125, -504.5588073730469, -480.5774841308594, -456.5961608886719, -432.61480712890625, -408.63348388671875, -384.65216064453125, -360.67083740234375, -336.68951416015625, -312.7081604003906, -288.7268371582031, -264.7455139160156, -240.76417541503906, -216.7828369140625, -192.801513671875, -168.8201904296875, -144.83885192871094, -120.8575210571289, -96.87619018554688, -72.89485931396484, -48.91352844238281, -24.93218994140625, -0.9508056640625, 23.03052520751953, 47.01185607910156, 70.9931869506836, 94.97451782226562, 118.95584869384766, 142.9371795654297, 166.91851806640625, 190.89984130859375, 214.88116455078125, 238.8625030517578, 262.8438415527344, 286.8251647949219, 310.8064880371094, 334.787841796875, 358.7691650390625, 382.75048828125, 406.7318115234375, 430.713134765625, 454.6944885253906, 478.6758117675781, 502.6571350097656, 526.6384887695312, 550.6198120117188, 574.6011352539062, 598.5824584960938, 622.5637817382812, 646.5451049804688, 670.5264892578125, 694.5078125, 718.4891357421875, 742.470458984375, 766.4517822265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 5.0, 6.0, 8.0, 14.0, 25.0, 40.0, 47.0, 66.0, 97.0, 191.0, 334.0, 628.0, 1142.0, 2436.0, 5237.0, 11780.0, 27985.0, 69960.0, 190559.0, 406538.0, 204485.0, 74394.0, 29464.0, 12280.0, 5521.0, 2513.0, 1271.0, 650.0, 336.0, 184.0, 116.0, 76.0, 48.0, 32.0, 17.0, 15.0, 9.0, 11.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.5, -112.9189453125, -109.337890625, -105.7568359375, -102.17578125, -98.5947265625, -95.013671875, -91.4326171875, -87.8515625, -84.2705078125, -80.689453125, -77.1083984375, -73.52734375, -69.9462890625, -66.365234375, -62.7841796875, -59.203125, -55.6220703125, -52.041015625, -48.4599609375, -44.87890625, -41.2978515625, -37.716796875, -34.1357421875, -30.5546875, -26.9736328125, -23.392578125, -19.8115234375, -16.23046875, -12.6494140625, -9.068359375, -5.4873046875, -1.90625, 1.6748046875, 5.255859375, 8.8369140625, 12.41796875, 15.9990234375, 19.580078125, 23.1611328125, 26.7421875, 30.3232421875, 33.904296875, 37.4853515625, 41.06640625, 44.6474609375, 48.228515625, 51.8095703125, 55.390625, 58.9716796875, 62.552734375, 66.1337890625, 69.71484375, 73.2958984375, 76.876953125, 80.4580078125, 84.0390625, 87.6201171875, 91.201171875, 94.7822265625, 98.36328125, 101.9443359375, 105.525390625, 109.1064453125, 112.6875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 11.0, 13.0, 18.0, 19.0, 12.0, 26.0, 19.0, 16.0, 21.0, 34.0, 33.0, 36.0, 48.0, 50.0, 44.0, 38.0, 47.0, 44.0, 46.0, 48.0, 38.0, 40.0, 50.0, 40.0, 19.0, 39.0, 28.0, 24.0, 16.0, 21.0, 11.0, 5.0, 9.0, 11.0, 7.0, 2.0, 7.0, 6.0, 1.0, 5.0, 2.0, 4.0], "bins": [-62.84375, -61.2421875, -59.640625, -58.0390625, -56.4375, -54.8359375, -53.234375, -51.6328125, -50.03125, -48.4296875, -46.828125, -45.2265625, -43.625, -42.0234375, -40.421875, -38.8203125, -37.21875, -35.6171875, -34.015625, -32.4140625, -30.8125, -29.2109375, -27.609375, -26.0078125, -24.40625, -22.8046875, -21.203125, -19.6015625, -18.0, -16.3984375, -14.796875, -13.1953125, -11.59375, -9.9921875, -8.390625, -6.7890625, -5.1875, -3.5859375, -1.984375, -0.3828125, 1.21875, 2.8203125, 4.421875, 6.0234375, 7.625, 9.2265625, 10.828125, 12.4296875, 14.03125, 15.6328125, 17.234375, 18.8359375, 20.4375, 22.0390625, 23.640625, 25.2421875, 26.84375, 28.4453125, 30.046875, 31.6484375, 33.25, 34.8515625, 36.453125, 38.0546875, 39.65625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 10.0, 12.0, 8.0, 14.0, 24.0, 16.0, 30.0, 28.0, 49.0, 65.0, 104.0, 164.0, 254.0, 363.0, 573.0, 1074.0, 2215.0, 5820.0, 22800.0, 221181.0, 726178.0, 51329.0, 9606.0, 3170.0, 1405.0, 749.0, 459.0, 260.0, 165.0, 112.0, 87.0, 58.0, 42.0, 28.0, 18.0, 13.0, 14.0, 14.0, 6.0, 7.0, 4.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-316.25, -306.7265625, -297.203125, -287.6796875, -278.15625, -268.6328125, -259.109375, -249.5859375, -240.0625, -230.5390625, -221.015625, -211.4921875, -201.96875, -192.4453125, -182.921875, -173.3984375, -163.875, -154.3515625, -144.828125, -135.3046875, -125.78125, -116.2578125, -106.734375, -97.2109375, -87.6875, -78.1640625, -68.640625, -59.1171875, -49.59375, -40.0703125, -30.546875, -21.0234375, -11.5, -1.9765625, 7.546875, 17.0703125, 26.59375, 36.1171875, 45.640625, 55.1640625, 64.6875, 74.2109375, 83.734375, 93.2578125, 102.78125, 112.3046875, 121.828125, 131.3515625, 140.875, 150.3984375, 159.921875, 169.4453125, 178.96875, 188.4921875, 198.015625, 207.5390625, 217.0625, 226.5859375, 236.109375, 245.6328125, 255.15625, 264.6796875, 274.203125, 283.7265625, 293.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 6.0, 10.0, 8.0, 7.0, 15.0, 14.0, 28.0, 27.0, 23.0, 35.0, 30.0, 45.0, 48.0, 48.0, 55.0, 56.0, 65.0, 69.0, 57.0, 54.0, 46.0, 42.0, 41.0, 30.0, 31.0, 18.0, 11.0, 17.0, 14.0, 13.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-290.75, -281.7734375, -272.796875, -263.8203125, -254.84375, -245.8671875, -236.890625, -227.9140625, -218.9375, -209.9609375, -200.984375, -192.0078125, -183.03125, -174.0546875, -165.078125, -156.1015625, -147.125, -138.1484375, -129.171875, -120.1953125, -111.21875, -102.2421875, -93.265625, -84.2890625, -75.3125, -66.3359375, -57.359375, -48.3828125, -39.40625, -30.4296875, -21.453125, -12.4765625, -3.5, 5.4765625, 14.453125, 23.4296875, 32.40625, 41.3828125, 50.359375, 59.3359375, 68.3125, 77.2890625, 86.265625, 95.2421875, 104.21875, 113.1953125, 122.171875, 131.1484375, 140.125, 149.1015625, 158.078125, 167.0546875, 176.03125, 185.0078125, 193.984375, 202.9609375, 211.9375, 220.9140625, 229.890625, 238.8671875, 247.84375, 256.8203125, 265.796875, 274.7734375, 283.75]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 10.0, 10.0, 22.0, 36.0, 45.0, 59.0, 100.0, 144.0, 233.0, 462.0, 962.0, 2519.0, 10199.0, 71975.0, 816443.0, 124875.0, 14530.0, 3538.0, 1160.0, 529.0, 235.0, 153.0, 106.0, 62.0, 34.0, 36.0, 24.0, 16.0, 9.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.125, -76.1513671875, -73.177734375, -70.2041015625, -67.23046875, -64.2568359375, -61.283203125, -58.3095703125, -55.3359375, -52.3623046875, -49.388671875, -46.4150390625, -43.44140625, -40.4677734375, -37.494140625, -34.5205078125, -31.546875, -28.5732421875, -25.599609375, -22.6259765625, -19.65234375, -16.6787109375, -13.705078125, -10.7314453125, -7.7578125, -4.7841796875, -1.810546875, 1.1630859375, 4.13671875, 7.1103515625, 10.083984375, 13.0576171875, 16.03125, 19.0048828125, 21.978515625, 24.9521484375, 27.92578125, 30.8994140625, 33.873046875, 36.8466796875, 39.8203125, 42.7939453125, 45.767578125, 48.7412109375, 51.71484375, 54.6884765625, 57.662109375, 60.6357421875, 63.609375, 66.5830078125, 69.556640625, 72.5302734375, 75.50390625, 78.4775390625, 81.451171875, 84.4248046875, 87.3984375, 90.3720703125, 93.345703125, 96.3193359375, 99.29296875, 102.2666015625, 105.240234375, 108.2138671875, 111.1875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 7.0, 8.0, 6.0, 4.0, 7.0, 9.0, 16.0, 11.0, 21.0, 16.0, 38.0, 33.0, 48.0, 58.0, 75.0, 96.0, 91.0, 101.0, 80.0, 53.0, 39.0, 32.0, 29.0, 26.0, 24.0, 20.0, 7.0, 8.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01372528076171875, -0.013242363929748535, -0.01275944709777832, -0.012276530265808105, -0.01179361343383789, -0.011310696601867676, -0.010827779769897461, -0.010344862937927246, -0.009861946105957031, -0.009379029273986816, -0.008896112442016602, -0.008413195610046387, -0.007930278778076172, -0.007447361946105957, -0.006964445114135742, -0.006481528282165527, -0.0059986114501953125, -0.005515694618225098, -0.005032777786254883, -0.004549860954284668, -0.004066944122314453, -0.0035840272903442383, -0.0031011104583740234, -0.0026181936264038086, -0.0021352767944335938, -0.001652359962463379, -0.001169443130493164, -0.0006865262985229492, -0.00020360946655273438, 0.00027930736541748047, 0.0007622241973876953, 0.0012451410293579102, 0.001728057861328125, 0.00221097469329834, 0.0026938915252685547, 0.0031768083572387695, 0.0036597251892089844, 0.004142642021179199, 0.004625558853149414, 0.005108475685119629, 0.005591392517089844, 0.006074309349060059, 0.0065572261810302734, 0.007040143013000488, 0.007523059844970703, 0.008005976676940918, 0.008488893508911133, 0.008971810340881348, 0.009454727172851562, 0.009937644004821777, 0.010420560836791992, 0.010903477668762207, 0.011386394500732422, 0.011869311332702637, 0.012352228164672852, 0.012835144996643066, 0.013318061828613281, 0.013800978660583496, 0.014283895492553711, 0.014766812324523926, 0.01524972915649414, 0.015732645988464355, 0.01621556282043457, 0.016698479652404785, 0.017181396484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 3.0, 6.0, 6.0, 10.0, 9.0, 19.0, 11.0, 21.0, 25.0, 39.0, 63.0, 91.0, 100.0, 181.0, 266.0, 457.0, 873.0, 1794.0, 4704.0, 16920.0, 133452.0, 793614.0, 76295.0, 12421.0, 3816.0, 1430.0, 681.0, 445.0, 259.0, 158.0, 108.0, 61.0, 36.0, 42.0, 26.0, 27.0, 19.0, 13.0, 12.0, 6.0, 11.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.6875, -74.1640625, -71.640625, -69.1171875, -66.59375, -64.0703125, -61.546875, -59.0234375, -56.5, -53.9765625, -51.453125, -48.9296875, -46.40625, -43.8828125, -41.359375, -38.8359375, -36.3125, -33.7890625, -31.265625, -28.7421875, -26.21875, -23.6953125, -21.171875, -18.6484375, -16.125, -13.6015625, -11.078125, -8.5546875, -6.03125, -3.5078125, -0.984375, 1.5390625, 4.0625, 6.5859375, 9.109375, 11.6328125, 14.15625, 16.6796875, 19.203125, 21.7265625, 24.25, 26.7734375, 29.296875, 31.8203125, 34.34375, 36.8671875, 39.390625, 41.9140625, 44.4375, 46.9609375, 49.484375, 52.0078125, 54.53125, 57.0546875, 59.578125, 62.1015625, 64.625, 67.1484375, 69.671875, 72.1953125, 74.71875, 77.2421875, 79.765625, 82.2890625, 84.8125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 7.0, 5.0, 6.0, 4.0, 7.0, 11.0, 18.0, 17.0, 28.0, 44.0, 47.0, 66.0, 71.0, 72.0, 99.0, 97.0, 88.0, 62.0, 61.0, 43.0, 31.0, 31.0, 21.0, 23.0, 8.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5, -64.111328125, -61.72265625, -59.333984375, -56.9453125, -54.556640625, -52.16796875, -49.779296875, -47.390625, -45.001953125, -42.61328125, -40.224609375, -37.8359375, -35.447265625, -33.05859375, -30.669921875, -28.28125, -25.892578125, -23.50390625, -21.115234375, -18.7265625, -16.337890625, -13.94921875, -11.560546875, -9.171875, -6.783203125, -4.39453125, -2.005859375, 0.3828125, 2.771484375, 5.16015625, 7.548828125, 9.9375, 12.326171875, 14.71484375, 17.103515625, 19.4921875, 21.880859375, 24.26953125, 26.658203125, 29.046875, 31.435546875, 33.82421875, 36.212890625, 38.6015625, 40.990234375, 43.37890625, 45.767578125, 48.15625, 50.544921875, 52.93359375, 55.322265625, 57.7109375, 60.099609375, 62.48828125, 64.876953125, 67.265625, 69.654296875, 72.04296875, 74.431640625, 76.8203125, 79.208984375, 81.59765625, 83.986328125, 86.375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 8.0, 8.0, 15.0, 57.0, 80.0, 122.0, 258.0, 181.0, 120.0, 72.0, 23.0, 21.0, 11.0, 9.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1689.157958984375, -1630.450927734375, -1571.743896484375, -1513.036865234375, -1454.329833984375, -1395.622802734375, -1336.915771484375, -1278.208740234375, -1219.501708984375, -1160.794677734375, -1102.087646484375, -1043.380615234375, -984.673583984375, -925.966552734375, -867.259521484375, -808.552490234375, -749.8455200195312, -691.1384887695312, -632.4314575195312, -573.7244262695312, -515.0173950195312, -456.3103942871094, -397.6033630371094, -338.8963317871094, -280.1893005371094, -221.48226928710938, -162.77523803710938, -104.06822204589844, -45.36119079589844, 13.3458251953125, 72.0528564453125, 130.7598876953125, 189.4669189453125, 248.1739501953125, 306.8809814453125, 365.5880126953125, 424.2950439453125, 483.0020446777344, 541.7091064453125, 600.4161376953125, 659.1231689453125, 717.8302001953125, 776.5372314453125, 835.2442626953125, 893.9512939453125, 952.6583251953125, 1011.3653564453125, 1070.0723876953125, 1128.779296875, 1187.486328125, 1246.193359375, 1304.900390625, 1363.607421875, 1422.314453125, 1481.021484375, 1539.728515625, 1598.435546875, 1657.142578125, 1715.849609375, 1774.556640625, 1833.263671875, 1891.970703125, 1950.677734375, 2009.384765625, 2068.091796875]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 2.0, 13.0, 13.0, 13.0, 11.0, 14.0, 19.0, 23.0, 28.0, 24.0, 50.0, 27.0, 31.0, 46.0, 47.0, 64.0, 73.0, 69.0, 65.0, 53.0, 35.0, 40.0, 39.0, 38.0, 20.0, 20.0, 22.0, 15.0, 15.0, 11.0, 14.0, 10.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1019.6337890625, -986.46142578125, -953.2890014648438, -920.1165771484375, -886.9442138671875, -853.7718505859375, -820.5994262695312, -787.427001953125, -754.254638671875, -721.082275390625, -687.9098510742188, -654.7374267578125, -621.5650634765625, -588.3927001953125, -555.2202758789062, -522.0478515625, -488.87548828125, -455.7030944824219, -422.53070068359375, -389.3583068847656, -356.1859130859375, -323.0135192871094, -289.84112548828125, -256.6687316894531, -223.496337890625, -190.32394409179688, -157.15155029296875, -123.97915649414062, -90.8067626953125, -57.634368896484375, -24.46197509765625, 8.710418701171875, 41.8829345703125, 75.05532836914062, 108.22772216796875, 141.40011596679688, 174.572509765625, 207.74490356445312, 240.91729736328125, 274.0896911621094, 307.2620849609375, 340.4344787597656, 373.60687255859375, 406.7792663574219, 439.95166015625, 473.1240539550781, 506.29644775390625, 539.4688720703125, 572.6412353515625, 605.8135986328125, 638.9860229492188, 672.158447265625, 705.330810546875, 738.503173828125, 771.6755981445312, 804.8480224609375, 838.0203857421875, 871.1927490234375, 904.3651733398438, 937.53759765625, 970.7099609375, 1003.88232421875, 1037.0546875, 1070.2271728515625, 1103.3995361328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 27.0, 52.0, 107.0, 294.0, 955.0, 3392.0, 19567.0, 528271.0, 3568289.0, 63508.0, 7350.0, 1617.0, 542.0, 179.0, 70.0, 34.0, 14.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-305.25, -299.1748046875, -293.099609375, -287.0244140625, -280.94921875, -274.8740234375, -268.798828125, -262.7236328125, -256.6484375, -250.5732421875, -244.498046875, -238.4228515625, -232.34765625, -226.2724609375, -220.197265625, -214.1220703125, -208.046875, -201.9716796875, -195.896484375, -189.8212890625, -183.74609375, -177.6708984375, -171.595703125, -165.5205078125, -159.4453125, -153.3701171875, -147.294921875, -141.2197265625, -135.14453125, -129.0693359375, -122.994140625, -116.9189453125, -110.84375, -104.7685546875, -98.693359375, -92.6181640625, -86.54296875, -80.4677734375, -74.392578125, -68.3173828125, -62.2421875, -56.1669921875, -50.091796875, -44.0166015625, -37.94140625, -31.8662109375, -25.791015625, -19.7158203125, -13.640625, -7.5654296875, -1.490234375, 4.5849609375, 10.66015625, 16.7353515625, 22.810546875, 28.8857421875, 34.9609375, 41.0361328125, 47.111328125, 53.1865234375, 59.26171875, 65.3369140625, 71.412109375, 77.4873046875, 83.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 5.0, 10.0, 24.0, 10.0, 17.0, 23.0, 26.0, 26.0, 29.0, 39.0, 49.0, 38.0, 44.0, 50.0, 49.0, 55.0, 51.0, 48.0, 51.0, 43.0, 39.0, 41.0, 40.0, 33.0, 26.0, 21.0, 31.0, 20.0, 11.0, 7.0, 7.0, 8.0, 11.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.28125, -43.59716796875, -41.9130859375, -40.22900390625, -38.544921875, -36.86083984375, -35.1767578125, -33.49267578125, -31.80859375, -30.12451171875, -28.4404296875, -26.75634765625, -25.072265625, -23.38818359375, -21.7041015625, -20.02001953125, -18.3359375, -16.65185546875, -14.9677734375, -13.28369140625, -11.599609375, -9.91552734375, -8.2314453125, -6.54736328125, -4.86328125, -3.17919921875, -1.4951171875, 0.18896484375, 1.873046875, 3.55712890625, 5.2412109375, 6.92529296875, 8.609375, 10.29345703125, 11.9775390625, 13.66162109375, 15.345703125, 17.02978515625, 18.7138671875, 20.39794921875, 22.08203125, 23.76611328125, 25.4501953125, 27.13427734375, 28.818359375, 30.50244140625, 32.1865234375, 33.87060546875, 35.5546875, 37.23876953125, 38.9228515625, 40.60693359375, 42.291015625, 43.97509765625, 45.6591796875, 47.34326171875, 49.02734375, 50.71142578125, 52.3955078125, 54.07958984375, 55.763671875, 57.44775390625, 59.1318359375, 60.81591796875, 62.5]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 9.0, 8.0, 8.0, 8.0, 20.0, 30.0, 65.0, 127.0, 285.0, 808.0, 2587.0, 10539.0, 79886.0, 3779901.0, 291828.0, 21967.0, 4224.0, 1210.0, 414.0, 178.0, 92.0, 35.0, 22.0, 7.0, 7.0, 6.0, 10.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-306.75, -297.64453125, -288.5390625, -279.43359375, -270.328125, -261.22265625, -252.1171875, -243.01171875, -233.90625, -224.80078125, -215.6953125, -206.58984375, -197.484375, -188.37890625, -179.2734375, -170.16796875, -161.0625, -151.95703125, -142.8515625, -133.74609375, -124.640625, -115.53515625, -106.4296875, -97.32421875, -88.21875, -79.11328125, -70.0078125, -60.90234375, -51.796875, -42.69140625, -33.5859375, -24.48046875, -15.375, -6.26953125, 2.8359375, 11.94140625, 21.046875, 30.15234375, 39.2578125, 48.36328125, 57.46875, 66.57421875, 75.6796875, 84.78515625, 93.890625, 102.99609375, 112.1015625, 121.20703125, 130.3125, 139.41796875, 148.5234375, 157.62890625, 166.734375, 175.83984375, 184.9453125, 194.05078125, 203.15625, 212.26171875, 221.3671875, 230.47265625, 239.578125, 248.68359375, 257.7890625, 266.89453125, 276.0]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 6.0, 5.0, 1.0, 9.0, 11.0, 13.0, 19.0, 22.0, 30.0, 63.0, 80.0, 139.0, 235.0, 516.0, 939.0, 858.0, 483.0, 213.0, 108.0, 77.0, 58.0, 42.0, 37.0, 21.0, 24.0, 10.0, 13.0, 3.0, 5.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-208.875, -202.724609375, -196.57421875, -190.423828125, -184.2734375, -178.123046875, -171.97265625, -165.822265625, -159.671875, -153.521484375, -147.37109375, -141.220703125, -135.0703125, -128.919921875, -122.76953125, -116.619140625, -110.46875, -104.318359375, -98.16796875, -92.017578125, -85.8671875, -79.716796875, -73.56640625, -67.416015625, -61.265625, -55.115234375, -48.96484375, -42.814453125, -36.6640625, -30.513671875, -24.36328125, -18.212890625, -12.0625, -5.912109375, 0.23828125, 6.388671875, 12.5390625, 18.689453125, 24.83984375, 30.990234375, 37.140625, 43.291015625, 49.44140625, 55.591796875, 61.7421875, 67.892578125, 74.04296875, 80.193359375, 86.34375, 92.494140625, 98.64453125, 104.794921875, 110.9453125, 117.095703125, 123.24609375, 129.396484375, 135.546875, 141.697265625, 147.84765625, 153.998046875, 160.1484375, 166.298828125, 172.44921875, 178.599609375, 184.75]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 5.0, 17.0, 43.0, 136.0, 221.0, 290.0, 158.0, 63.0, 25.0, 11.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1507.7232666015625, -1433.5953369140625, -1359.4674072265625, -1285.3394775390625, -1211.2115478515625, -1137.0836181640625, -1062.95556640625, -988.8276977539062, -914.6997680664062, -840.5718383789062, -766.4439086914062, -692.31591796875, -618.18798828125, -544.06005859375, -469.93212890625, -395.80419921875, -321.67626953125, -247.54833984375, -173.42039489746094, -99.29244995117188, -25.164520263671875, 48.963409423828125, 123.09136962890625, 197.21929931640625, 271.34722900390625, 345.47515869140625, 419.60308837890625, 493.7310485839844, 567.8590087890625, 641.9869384765625, 716.1148681640625, 790.2427978515625, 864.37060546875, 938.49853515625, 1012.62646484375, 1086.75439453125, 1160.88232421875, 1235.01025390625, 1309.13818359375, 1383.26611328125, 1457.39404296875, 1531.52197265625, 1605.64990234375, 1679.77783203125, 1753.90576171875, 1828.03369140625, 1902.16162109375, 1976.28955078125, 2050.41748046875, 2124.54541015625, 2198.67333984375, 2272.80126953125, 2346.92919921875, 2421.05712890625, 2495.18505859375, 2569.31298828125, 2643.441162109375, 2717.569091796875, 2791.697021484375, 2865.824951171875, 2939.952880859375, 3014.080810546875, 3088.208740234375, 3162.336669921875, 3236.464599609375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 4.0, 1.0, 3.0, 6.0, 5.0, 9.0, 9.0, 11.0, 12.0, 12.0, 19.0, 22.0, 23.0, 32.0, 23.0, 26.0, 46.0, 31.0, 35.0, 46.0, 40.0, 46.0, 41.0, 41.0, 51.0, 49.0, 38.0, 49.0, 41.0, 23.0, 31.0, 31.0, 25.0, 14.0, 19.0, 16.0, 15.0, 9.0, 14.0, 10.0, 5.0, 4.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-801.9260864257812, -776.4638061523438, -751.0015258789062, -725.5392456054688, -700.0769653320312, -674.6146850585938, -649.1524047851562, -623.6901245117188, -598.2278442382812, -572.7655639648438, -547.3032836914062, -521.8410034179688, -496.37872314453125, -470.91644287109375, -445.45416259765625, -419.99188232421875, -394.5296325683594, -369.0673522949219, -343.6050720214844, -318.1427917480469, -292.6805114746094, -267.2182312011719, -241.75596618652344, -216.29368591308594, -190.83140563964844, -165.36912536621094, -139.90684509277344, -114.44457244873047, -88.98229217529297, -63.52001190185547, -38.0577392578125, -12.595458984375, 12.8668212890625, 38.3291015625, 63.791378021240234, 89.25365447998047, 114.71593475341797, 140.17822265625, 165.64048767089844, 191.10276794433594, 216.56504821777344, 242.02732849121094, 267.4895935058594, 292.9518737792969, 318.4141540527344, 343.8764343261719, 369.3387145996094, 394.8009948730469, 420.2632751464844, 445.7255554199219, 471.1878356933594, 496.6501159667969, 522.1123657226562, 547.5746459960938, 573.0369262695312, 598.4992065429688, 623.9614868164062, 649.4237670898438, 674.8860473632812, 700.3483276367188, 725.8106079101562, 751.2728881835938, 776.7351684570312, 802.1974487304688, 827.6597290039062]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 8.0, 7.0, 6.0, 13.0, 21.0, 30.0, 49.0, 98.0, 152.0, 325.0, 564.0, 1059.0, 2058.0, 4507.0, 10687.0, 27791.0, 84755.0, 292204.0, 424114.0, 131914.0, 41244.0, 14926.0, 6255.0, 2821.0, 1393.0, 699.0, 388.0, 178.0, 110.0, 68.0, 45.0, 29.0, 10.0, 10.0, 7.0, 8.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-163.75, -159.224609375, -154.69921875, -150.173828125, -145.6484375, -141.123046875, -136.59765625, -132.072265625, -127.546875, -123.021484375, -118.49609375, -113.970703125, -109.4453125, -104.919921875, -100.39453125, -95.869140625, -91.34375, -86.818359375, -82.29296875, -77.767578125, -73.2421875, -68.716796875, -64.19140625, -59.666015625, -55.140625, -50.615234375, -46.08984375, -41.564453125, -37.0390625, -32.513671875, -27.98828125, -23.462890625, -18.9375, -14.412109375, -9.88671875, -5.361328125, -0.8359375, 3.689453125, 8.21484375, 12.740234375, 17.265625, 21.791015625, 26.31640625, 30.841796875, 35.3671875, 39.892578125, 44.41796875, 48.943359375, 53.46875, 57.994140625, 62.51953125, 67.044921875, 71.5703125, 76.095703125, 80.62109375, 85.146484375, 89.671875, 94.197265625, 98.72265625, 103.248046875, 107.7734375, 112.298828125, 116.82421875, 121.349609375, 125.875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 8.0, 6.0, 13.0, 14.0, 17.0, 15.0, 16.0, 16.0, 20.0, 21.0, 38.0, 44.0, 40.0, 43.0, 35.0, 30.0, 44.0, 41.0, 49.0, 36.0, 57.0, 47.0, 38.0, 42.0, 43.0, 36.0, 36.0, 31.0, 22.0, 20.0, 14.0, 8.0, 9.0, 11.0, 6.0, 6.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.84375, -44.10595703125, -42.3681640625, -40.63037109375, -38.892578125, -37.15478515625, -35.4169921875, -33.67919921875, -31.94140625, -30.20361328125, -28.4658203125, -26.72802734375, -24.990234375, -23.25244140625, -21.5146484375, -19.77685546875, -18.0390625, -16.30126953125, -14.5634765625, -12.82568359375, -11.087890625, -9.35009765625, -7.6123046875, -5.87451171875, -4.13671875, -2.39892578125, -0.6611328125, 1.07666015625, 2.814453125, 4.55224609375, 6.2900390625, 8.02783203125, 9.765625, 11.50341796875, 13.2412109375, 14.97900390625, 16.716796875, 18.45458984375, 20.1923828125, 21.93017578125, 23.66796875, 25.40576171875, 27.1435546875, 28.88134765625, 30.619140625, 32.35693359375, 34.0947265625, 35.83251953125, 37.5703125, 39.30810546875, 41.0458984375, 42.78369140625, 44.521484375, 46.25927734375, 47.9970703125, 49.73486328125, 51.47265625, 53.21044921875, 54.9482421875, 56.68603515625, 58.423828125, 60.16162109375, 61.8994140625, 63.63720703125, 65.375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 7.0, 9.0, 15.0, 11.0, 15.0, 24.0, 24.0, 49.0, 67.0, 77.0, 129.0, 165.0, 244.0, 399.0, 695.0, 1282.0, 2638.0, 7037.0, 30754.0, 313427.0, 632408.0, 43484.0, 8910.0, 3129.0, 1450.0, 765.0, 433.0, 249.0, 205.0, 133.0, 92.0, 70.0, 49.0, 27.0, 19.0, 18.0, 14.0, 7.0, 12.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-335.25, -325.6953125, -316.140625, -306.5859375, -297.03125, -287.4765625, -277.921875, -268.3671875, -258.8125, -249.2578125, -239.703125, -230.1484375, -220.59375, -211.0390625, -201.484375, -191.9296875, -182.375, -172.8203125, -163.265625, -153.7109375, -144.15625, -134.6015625, -125.046875, -115.4921875, -105.9375, -96.3828125, -86.828125, -77.2734375, -67.71875, -58.1640625, -48.609375, -39.0546875, -29.5, -19.9453125, -10.390625, -0.8359375, 8.71875, 18.2734375, 27.828125, 37.3828125, 46.9375, 56.4921875, 66.046875, 75.6015625, 85.15625, 94.7109375, 104.265625, 113.8203125, 123.375, 132.9296875, 142.484375, 152.0390625, 161.59375, 171.1484375, 180.703125, 190.2578125, 199.8125, 209.3671875, 218.921875, 228.4765625, 238.03125, 247.5859375, 257.140625, 266.6953125, 276.25]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 0.0, 7.0, 8.0, 3.0, 6.0, 11.0, 9.0, 17.0, 25.0, 28.0, 33.0, 36.0, 41.0, 43.0, 47.0, 47.0, 52.0, 63.0, 48.0, 63.0, 58.0, 54.0, 54.0, 49.0, 32.0, 28.0, 27.0, 16.0, 18.0, 11.0, 18.0, 10.0, 12.0, 2.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.0, -251.1640625, -242.328125, -233.4921875, -224.65625, -215.8203125, -206.984375, -198.1484375, -189.3125, -180.4765625, -171.640625, -162.8046875, -153.96875, -145.1328125, -136.296875, -127.4609375, -118.625, -109.7890625, -100.953125, -92.1171875, -83.28125, -74.4453125, -65.609375, -56.7734375, -47.9375, -39.1015625, -30.265625, -21.4296875, -12.59375, -3.7578125, 5.078125, 13.9140625, 22.75, 31.5859375, 40.421875, 49.2578125, 58.09375, 66.9296875, 75.765625, 84.6015625, 93.4375, 102.2734375, 111.109375, 119.9453125, 128.78125, 137.6171875, 146.453125, 155.2890625, 164.125, 172.9609375, 181.796875, 190.6328125, 199.46875, 208.3046875, 217.140625, 225.9765625, 234.8125, 243.6484375, 252.484375, 261.3203125, 270.15625, 278.9921875, 287.828125, 296.6640625, 305.5]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 3.0, 8.0, 6.0, 5.0, 6.0, 12.0, 19.0, 22.0, 36.0, 50.0, 57.0, 100.0, 143.0, 245.0, 382.0, 776.0, 1814.0, 5684.0, 24002.0, 209830.0, 726887.0, 62026.0, 10670.0, 3138.0, 1198.0, 564.0, 328.0, 188.0, 112.0, 70.0, 38.0, 41.0, 23.0, 14.0, 12.0, 6.0, 6.0, 10.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-79.0625, -76.5322265625, -74.001953125, -71.4716796875, -68.94140625, -66.4111328125, -63.880859375, -61.3505859375, -58.8203125, -56.2900390625, -53.759765625, -51.2294921875, -48.69921875, -46.1689453125, -43.638671875, -41.1083984375, -38.578125, -36.0478515625, -33.517578125, -30.9873046875, -28.45703125, -25.9267578125, -23.396484375, -20.8662109375, -18.3359375, -15.8056640625, -13.275390625, -10.7451171875, -8.21484375, -5.6845703125, -3.154296875, -0.6240234375, 1.90625, 4.4365234375, 6.966796875, 9.4970703125, 12.02734375, 14.5576171875, 17.087890625, 19.6181640625, 22.1484375, 24.6787109375, 27.208984375, 29.7392578125, 32.26953125, 34.7998046875, 37.330078125, 39.8603515625, 42.390625, 44.9208984375, 47.451171875, 49.9814453125, 52.51171875, 55.0419921875, 57.572265625, 60.1025390625, 62.6328125, 65.1630859375, 67.693359375, 70.2236328125, 72.75390625, 75.2841796875, 77.814453125, 80.3447265625, 82.875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 8.0, 6.0, 14.0, 6.0, 11.0, 11.0, 13.0, 26.0, 31.0, 31.0, 28.0, 63.0, 54.0, 63.0, 76.0, 73.0, 81.0, 74.0, 44.0, 52.0, 41.0, 43.0, 21.0, 19.0, 22.0, 11.0, 15.0, 12.0, 7.0, 5.0, 7.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01324462890625, -0.012779951095581055, -0.01231527328491211, -0.011850595474243164, -0.011385917663574219, -0.010921239852905273, -0.010456562042236328, -0.009991884231567383, -0.009527206420898438, -0.009062528610229492, -0.008597850799560547, -0.008133172988891602, -0.007668495178222656, -0.007203817367553711, -0.006739139556884766, -0.00627446174621582, -0.005809783935546875, -0.00534510612487793, -0.004880428314208984, -0.004415750503540039, -0.003951072692871094, -0.0034863948822021484, -0.003021717071533203, -0.002557039260864258, -0.0020923614501953125, -0.0016276836395263672, -0.0011630058288574219, -0.0006983280181884766, -0.00023365020751953125, 0.00023102760314941406, 0.0006957054138183594, 0.0011603832244873047, 0.00162506103515625, 0.0020897388458251953, 0.0025544166564941406, 0.003019094467163086, 0.0034837722778320312, 0.0039484500885009766, 0.004413127899169922, 0.004877805709838867, 0.0053424835205078125, 0.005807161331176758, 0.006271839141845703, 0.0067365169525146484, 0.007201194763183594, 0.007665872573852539, 0.008130550384521484, 0.00859522819519043, 0.009059906005859375, 0.00952458381652832, 0.009989261627197266, 0.010453939437866211, 0.010918617248535156, 0.011383295059204102, 0.011847972869873047, 0.012312650680541992, 0.012777328491210938, 0.013242006301879883, 0.013706684112548828, 0.014171361923217773, 0.014636039733886719, 0.015100717544555664, 0.01556539535522461, 0.016030073165893555, 0.0164947509765625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 6.0, 14.0, 10.0, 15.0, 22.0, 29.0, 59.0, 71.0, 105.0, 184.0, 301.0, 576.0, 1164.0, 2585.0, 7952.0, 43219.0, 663927.0, 291682.0, 26555.0, 5759.0, 2100.0, 969.0, 468.0, 289.0, 158.0, 103.0, 54.0, 60.0, 24.0, 25.0, 12.0, 12.0, 9.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-76.125, -73.5771484375, -71.029296875, -68.4814453125, -65.93359375, -63.3857421875, -60.837890625, -58.2900390625, -55.7421875, -53.1943359375, -50.646484375, -48.0986328125, -45.55078125, -43.0029296875, -40.455078125, -37.9072265625, -35.359375, -32.8115234375, -30.263671875, -27.7158203125, -25.16796875, -22.6201171875, -20.072265625, -17.5244140625, -14.9765625, -12.4287109375, -9.880859375, -7.3330078125, -4.78515625, -2.2373046875, 0.310546875, 2.8583984375, 5.40625, 7.9541015625, 10.501953125, 13.0498046875, 15.59765625, 18.1455078125, 20.693359375, 23.2412109375, 25.7890625, 28.3369140625, 30.884765625, 33.4326171875, 35.98046875, 38.5283203125, 41.076171875, 43.6240234375, 46.171875, 48.7197265625, 51.267578125, 53.8154296875, 56.36328125, 58.9111328125, 61.458984375, 64.0068359375, 66.5546875, 69.1025390625, 71.650390625, 74.1982421875, 76.74609375, 79.2939453125, 81.841796875, 84.3896484375, 86.9375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 7.0, 1.0, 2.0, 6.0, 13.0, 19.0, 34.0, 42.0, 54.0, 75.0, 75.0, 99.0, 98.0, 95.0, 91.0, 88.0, 51.0, 45.0, 32.0, 24.0, 20.0, 10.0, 8.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.5, -62.865234375, -60.23046875, -57.595703125, -54.9609375, -52.326171875, -49.69140625, -47.056640625, -44.421875, -41.787109375, -39.15234375, -36.517578125, -33.8828125, -31.248046875, -28.61328125, -25.978515625, -23.34375, -20.708984375, -18.07421875, -15.439453125, -12.8046875, -10.169921875, -7.53515625, -4.900390625, -2.265625, 0.369140625, 3.00390625, 5.638671875, 8.2734375, 10.908203125, 13.54296875, 16.177734375, 18.8125, 21.447265625, 24.08203125, 26.716796875, 29.3515625, 31.986328125, 34.62109375, 37.255859375, 39.890625, 42.525390625, 45.16015625, 47.794921875, 50.4296875, 53.064453125, 55.69921875, 58.333984375, 60.96875, 63.603515625, 66.23828125, 68.873046875, 71.5078125, 74.142578125, 76.77734375, 79.412109375, 82.046875, 84.681640625, 87.31640625, 89.951171875, 92.5859375, 95.220703125, 97.85546875, 100.490234375, 103.125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 9.0, 12.0, 11.0, 20.0, 44.0, 67.0, 134.0, 274.0, 220.0, 102.0, 52.0, 28.0, 15.0, 6.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1750.259765625, -1687.6319580078125, -1625.004150390625, -1562.37646484375, -1499.7486572265625, -1437.120849609375, -1374.4930419921875, -1311.865234375, -1249.2374267578125, -1186.609619140625, -1123.9818115234375, -1061.35400390625, -998.7262573242188, -936.0985107421875, -873.470703125, -810.8428955078125, -748.2151489257812, -685.5873413085938, -622.9595947265625, -560.331787109375, -497.7039794921875, -435.0762023925781, -372.44842529296875, -309.82061767578125, -247.19284057617188, -184.56504821777344, -121.93726348876953, -59.309478759765625, 3.3183135986328125, 65.94610595703125, 128.57388305664062, 191.20169067382812, 253.8294677734375, 316.4572448730469, 379.0850524902344, 441.71282958984375, 504.34063720703125, 566.9683837890625, 629.59619140625, 692.2239990234375, 754.851806640625, 817.4796142578125, 880.1073608398438, 942.7351684570312, 1005.3629760742188, 1067.99072265625, 1130.6185302734375, 1193.246337890625, 1255.8740234375, 1318.5018310546875, 1381.129638671875, 1443.75732421875, 1506.3851318359375, 1569.012939453125, 1631.6407470703125, 1694.2685546875, 1756.8963623046875, 1819.524169921875, 1882.1519775390625, 1944.77978515625, 2007.407470703125, 2070.035400390625, 2132.6630859375, 2195.291015625, 2257.918701171875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 1.0, 3.0, 4.0, 6.0, 5.0, 9.0, 10.0, 8.0, 13.0, 11.0, 27.0, 21.0, 26.0, 21.0, 27.0, 33.0, 46.0, 41.0, 46.0, 66.0, 80.0, 71.0, 61.0, 41.0, 34.0, 40.0, 28.0, 34.0, 26.0, 28.0, 24.0, 24.0, 18.0, 11.0, 8.0, 6.0, 12.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1079.7674560546875, -1048.6453857421875, -1017.5233764648438, -986.4013671875, -955.279296875, -924.1572875976562, -893.0352783203125, -861.9132080078125, -830.7911376953125, -799.6691284179688, -768.5470581054688, -737.425048828125, -706.302978515625, -675.1809692382812, -644.0589599609375, -612.9368896484375, -581.8148803710938, -550.69287109375, -519.57080078125, -488.44879150390625, -457.32672119140625, -426.2047119140625, -395.0826721191406, -363.96063232421875, -332.8385925292969, -301.716552734375, -270.5945129394531, -239.4724884033203, -208.35044860839844, -177.22840881347656, -146.10638427734375, -114.98434448242188, -83.86224365234375, -52.74020767211914, -21.61817169189453, 9.503860473632812, 40.62590026855469, 71.74794006347656, 102.86996459960938, 133.99200439453125, 165.11404418945312, 196.236083984375, 227.35812377929688, 258.48016357421875, 289.6021728515625, 320.7242431640625, 351.84625244140625, 382.9682922363281, 414.09033203125, 445.2123718261719, 476.33441162109375, 507.4564208984375, 538.5784912109375, 569.7005004882812, 600.822509765625, 631.944580078125, 663.066650390625, 694.1886596679688, 725.3107299804688, 756.4327392578125, 787.5548095703125, 818.6768188476562, 849.798828125, 880.9208984375, 912.0429077148438]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 14.0, 26.0, 58.0, 116.0, 292.0, 842.0, 2905.0, 16084.0, 468702.0, 3601310.0, 93837.0, 7511.0, 1670.0, 579.0, 194.0, 65.0, 46.0, 20.0, 9.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-251.5, -246.3994140625, -241.298828125, -236.1982421875, -231.09765625, -225.9970703125, -220.896484375, -215.7958984375, -210.6953125, -205.5947265625, -200.494140625, -195.3935546875, -190.29296875, -185.1923828125, -180.091796875, -174.9912109375, -169.890625, -164.7900390625, -159.689453125, -154.5888671875, -149.48828125, -144.3876953125, -139.287109375, -134.1865234375, -129.0859375, -123.9853515625, -118.884765625, -113.7841796875, -108.68359375, -103.5830078125, -98.482421875, -93.3818359375, -88.28125, -83.1806640625, -78.080078125, -72.9794921875, -67.87890625, -62.7783203125, -57.677734375, -52.5771484375, -47.4765625, -42.3759765625, -37.275390625, -32.1748046875, -27.07421875, -21.9736328125, -16.873046875, -11.7724609375, -6.671875, -1.5712890625, 3.529296875, 8.6298828125, 13.73046875, 18.8310546875, 23.931640625, 29.0322265625, 34.1328125, 39.2333984375, 44.333984375, 49.4345703125, 54.53515625, 59.6357421875, 64.736328125, 69.8369140625, 74.9375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 10.0, 8.0, 15.0, 13.0, 14.0, 19.0, 22.0, 24.0, 17.0, 32.0, 28.0, 38.0, 35.0, 32.0, 45.0, 36.0, 44.0, 43.0, 39.0, 47.0, 52.0, 44.0, 45.0, 31.0, 37.0, 36.0, 27.0, 29.0, 14.0, 23.0, 22.0, 14.0, 6.0, 12.0, 6.0, 4.0, 4.0, 6.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-48.34375, -46.77783203125, -45.2119140625, -43.64599609375, -42.080078125, -40.51416015625, -38.9482421875, -37.38232421875, -35.81640625, -34.25048828125, -32.6845703125, -31.11865234375, -29.552734375, -27.98681640625, -26.4208984375, -24.85498046875, -23.2890625, -21.72314453125, -20.1572265625, -18.59130859375, -17.025390625, -15.45947265625, -13.8935546875, -12.32763671875, -10.76171875, -9.19580078125, -7.6298828125, -6.06396484375, -4.498046875, -2.93212890625, -1.3662109375, 0.19970703125, 1.765625, 3.33154296875, 4.8974609375, 6.46337890625, 8.029296875, 9.59521484375, 11.1611328125, 12.72705078125, 14.29296875, 15.85888671875, 17.4248046875, 18.99072265625, 20.556640625, 22.12255859375, 23.6884765625, 25.25439453125, 26.8203125, 28.38623046875, 29.9521484375, 31.51806640625, 33.083984375, 34.64990234375, 36.2158203125, 37.78173828125, 39.34765625, 40.91357421875, 42.4794921875, 44.04541015625, 45.611328125, 47.17724609375, 48.7431640625, 50.30908203125, 51.875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 6.0, 14.0, 21.0, 26.0, 28.0, 55.0, 87.0, 139.0, 189.0, 410.0, 733.0, 1432.0, 3241.0, 9353.0, 38934.0, 614199.0, 3410800.0, 89621.0, 16335.0, 4747.0, 1866.0, 840.0, 455.0, 262.0, 168.0, 102.0, 66.0, 43.0, 26.0, 34.0, 9.0, 11.0, 12.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-184.125, -178.224609375, -172.32421875, -166.423828125, -160.5234375, -154.623046875, -148.72265625, -142.822265625, -136.921875, -131.021484375, -125.12109375, -119.220703125, -113.3203125, -107.419921875, -101.51953125, -95.619140625, -89.71875, -83.818359375, -77.91796875, -72.017578125, -66.1171875, -60.216796875, -54.31640625, -48.416015625, -42.515625, -36.615234375, -30.71484375, -24.814453125, -18.9140625, -13.013671875, -7.11328125, -1.212890625, 4.6875, 10.587890625, 16.48828125, 22.388671875, 28.2890625, 34.189453125, 40.08984375, 45.990234375, 51.890625, 57.791015625, 63.69140625, 69.591796875, 75.4921875, 81.392578125, 87.29296875, 93.193359375, 99.09375, 104.994140625, 110.89453125, 116.794921875, 122.6953125, 128.595703125, 134.49609375, 140.396484375, 146.296875, 152.197265625, 158.09765625, 163.998046875, 169.8984375, 175.798828125, 181.69921875, 187.599609375, 193.5]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 6.0, 9.0, 18.0, 20.0, 36.0, 59.0, 123.0, 196.0, 630.0, 1327.0, 916.0, 361.0, 122.0, 67.0, 54.0, 34.0, 29.0, 11.0, 13.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-210.75, -203.66796875, -196.5859375, -189.50390625, -182.421875, -175.33984375, -168.2578125, -161.17578125, -154.09375, -147.01171875, -139.9296875, -132.84765625, -125.765625, -118.68359375, -111.6015625, -104.51953125, -97.4375, -90.35546875, -83.2734375, -76.19140625, -69.109375, -62.02734375, -54.9453125, -47.86328125, -40.78125, -33.69921875, -26.6171875, -19.53515625, -12.453125, -5.37109375, 1.7109375, 8.79296875, 15.875, 22.95703125, 30.0390625, 37.12109375, 44.203125, 51.28515625, 58.3671875, 65.44921875, 72.53125, 79.61328125, 86.6953125, 93.77734375, 100.859375, 107.94140625, 115.0234375, 122.10546875, 129.1875, 136.26953125, 143.3515625, 150.43359375, 157.515625, 164.59765625, 171.6796875, 178.76171875, 185.84375, 192.92578125, 200.0078125, 207.08984375, 214.171875, 221.25390625, 228.3359375, 235.41796875, 242.5]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 3.0, 6.0, 17.0, 55.0, 131.0, 302.0, 306.0, 104.0, 35.0, 19.0, 4.0, 6.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2364.404296875, -2282.893798828125, -2201.38330078125, -2119.872802734375, -2038.3623046875, -1956.851806640625, -1875.3414306640625, -1793.8309326171875, -1712.3204345703125, -1630.8099365234375, -1549.2994384765625, -1467.7889404296875, -1386.278564453125, -1304.76806640625, -1223.257568359375, -1141.7470703125, -1060.236572265625, -978.72607421875, -897.215576171875, -815.7051391601562, -734.1946411132812, -652.6841430664062, -571.1737060546875, -489.6632080078125, -408.1527099609375, -326.6422119140625, -245.13174438476562, -163.6212615966797, -82.11077880859375, -0.60028076171875, 80.91018676757812, 162.420654296875, 243.930908203125, 325.44140625, 406.9518737792969, 488.46234130859375, 569.9728393554688, 651.4833374023438, 732.9937744140625, 814.5042724609375, 896.0147705078125, 977.5252685546875, 1059.0357666015625, 1140.5462646484375, 1222.056640625, 1303.567138671875, 1385.07763671875, 1466.588134765625, 1548.0986328125, 1629.609130859375, 1711.11962890625, 1792.630126953125, 1874.140625, 1955.651123046875, 2037.1614990234375, 2118.671875, 2200.1826171875, 2281.693115234375, 2363.20361328125, 2444.714111328125, 2526.224609375, 2607.735107421875, 2689.24560546875, 2770.755859375, 2852.266357421875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 4.0, 16.0, 10.0, 13.0, 21.0, 31.0, 31.0, 20.0, 33.0, 34.0, 43.0, 35.0, 52.0, 64.0, 49.0, 60.0, 61.0, 53.0, 45.0, 52.0, 53.0, 29.0, 31.0, 32.0, 28.0, 18.0, 13.0, 6.0, 15.0, 13.0, 6.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-959.0203247070312, -931.435546875, -903.8507080078125, -876.2659301757812, -848.6810913085938, -821.0963134765625, -793.511474609375, -765.9266967773438, -738.3419189453125, -710.7571411132812, -683.1723022460938, -655.5875244140625, -628.002685546875, -600.4179077148438, -572.8331298828125, -545.248291015625, -517.6634521484375, -490.0786437988281, -462.49383544921875, -434.9090576171875, -407.32421875, -379.73944091796875, -352.1546325683594, -324.56982421875, -296.9850158691406, -269.40020751953125, -241.81539916992188, -214.23060607910156, -186.6457977294922, -159.0609893798828, -131.4761962890625, -103.89138793945312, -76.3065185546875, -48.72171401977539, -21.13690948486328, 6.4478912353515625, 34.03269958496094, 61.61750793457031, 89.20230102539062, 116.787109375, 144.37191772460938, 171.95672607421875, 199.54153442382812, 227.12632751464844, 254.7111358642578, 282.29595947265625, 309.8807373046875, 337.4655456542969, 365.05035400390625, 392.6351623535156, 420.219970703125, 447.80474853515625, 475.38958740234375, 502.974365234375, 530.5592041015625, 558.1439819335938, 585.728759765625, 613.3135375976562, 640.8983764648438, 668.483154296875, 696.0679931640625, 723.6527709960938, 751.237548828125, 778.8223876953125, 806.4072265625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 10.0, 13.0, 16.0, 28.0, 49.0, 69.0, 101.0, 167.0, 264.0, 452.0, 793.0, 1294.0, 2326.0, 4257.0, 8285.0, 16484.0, 34749.0, 77340.0, 178858.0, 325913.0, 217300.0, 95776.0, 42969.0, 19994.0, 9572.0, 4949.0, 2811.0, 1515.0, 878.0, 530.0, 308.0, 162.0, 120.0, 70.0, 47.0, 27.0, 16.0, 18.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-100.1875, -97.4521484375, -94.716796875, -91.9814453125, -89.24609375, -86.5107421875, -83.775390625, -81.0400390625, -78.3046875, -75.5693359375, -72.833984375, -70.0986328125, -67.36328125, -64.6279296875, -61.892578125, -59.1572265625, -56.421875, -53.6865234375, -50.951171875, -48.2158203125, -45.48046875, -42.7451171875, -40.009765625, -37.2744140625, -34.5390625, -31.8037109375, -29.068359375, -26.3330078125, -23.59765625, -20.8623046875, -18.126953125, -15.3916015625, -12.65625, -9.9208984375, -7.185546875, -4.4501953125, -1.71484375, 1.0205078125, 3.755859375, 6.4912109375, 9.2265625, 11.9619140625, 14.697265625, 17.4326171875, 20.16796875, 22.9033203125, 25.638671875, 28.3740234375, 31.109375, 33.8447265625, 36.580078125, 39.3154296875, 42.05078125, 44.7861328125, 47.521484375, 50.2568359375, 52.9921875, 55.7275390625, 58.462890625, 61.1982421875, 63.93359375, 66.6689453125, 69.404296875, 72.1396484375, 74.875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 6.0, 3.0, 4.0, 9.0, 7.0, 9.0, 17.0, 15.0, 12.0, 27.0, 27.0, 23.0, 32.0, 30.0, 26.0, 50.0, 37.0, 43.0, 48.0, 46.0, 53.0, 58.0, 43.0, 47.0, 45.0, 43.0, 50.0, 31.0, 24.0, 28.0, 22.0, 14.0, 16.0, 10.0, 11.0, 7.0, 12.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-77.25, -75.18017578125, -73.1103515625, -71.04052734375, -68.970703125, -66.90087890625, -64.8310546875, -62.76123046875, -60.69140625, -58.62158203125, -56.5517578125, -54.48193359375, -52.412109375, -50.34228515625, -48.2724609375, -46.20263671875, -44.1328125, -42.06298828125, -39.9931640625, -37.92333984375, -35.853515625, -33.78369140625, -31.7138671875, -29.64404296875, -27.57421875, -25.50439453125, -23.4345703125, -21.36474609375, -19.294921875, -17.22509765625, -15.1552734375, -13.08544921875, -11.015625, -8.94580078125, -6.8759765625, -4.80615234375, -2.736328125, -0.66650390625, 1.4033203125, 3.47314453125, 5.54296875, 7.61279296875, 9.6826171875, 11.75244140625, 13.822265625, 15.89208984375, 17.9619140625, 20.03173828125, 22.1015625, 24.17138671875, 26.2412109375, 28.31103515625, 30.380859375, 32.45068359375, 34.5205078125, 36.59033203125, 38.66015625, 40.72998046875, 42.7998046875, 44.86962890625, 46.939453125, 49.00927734375, 51.0791015625, 53.14892578125, 55.21875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 1.0, 1.0, 14.0, 19.0, 20.0, 26.0, 42.0, 75.0, 106.0, 159.0, 307.0, 645.0, 1830.0, 6511.0, 34204.0, 333631.0, 614068.0, 45115.0, 7955.0, 2184.0, 830.0, 365.0, 183.0, 86.0, 65.0, 33.0, 24.0, 20.0, 10.0, 6.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.125, -232.830078125, -224.53515625, -216.240234375, -207.9453125, -199.650390625, -191.35546875, -183.060546875, -174.765625, -166.470703125, -158.17578125, -149.880859375, -141.5859375, -133.291015625, -124.99609375, -116.701171875, -108.40625, -100.111328125, -91.81640625, -83.521484375, -75.2265625, -66.931640625, -58.63671875, -50.341796875, -42.046875, -33.751953125, -25.45703125, -17.162109375, -8.8671875, -0.572265625, 7.72265625, 16.017578125, 24.3125, 32.607421875, 40.90234375, 49.197265625, 57.4921875, 65.787109375, 74.08203125, 82.376953125, 90.671875, 98.966796875, 107.26171875, 115.556640625, 123.8515625, 132.146484375, 140.44140625, 148.736328125, 157.03125, 165.326171875, 173.62109375, 181.916015625, 190.2109375, 198.505859375, 206.80078125, 215.095703125, 223.390625, 231.685546875, 239.98046875, 248.275390625, 256.5703125, 264.865234375, 273.16015625, 281.455078125, 289.75]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 9.0, 3.0, 9.0, 15.0, 14.0, 9.0, 18.0, 23.0, 24.0, 20.0, 41.0, 35.0, 58.0, 50.0, 59.0, 53.0, 59.0, 58.0, 37.0, 44.0, 56.0, 37.0, 47.0, 29.0, 31.0, 33.0, 23.0, 19.0, 15.0, 16.0, 14.0, 5.0, 13.0, 9.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-316.75, -308.02734375, -299.3046875, -290.58203125, -281.859375, -273.13671875, -264.4140625, -255.69140625, -246.96875, -238.24609375, -229.5234375, -220.80078125, -212.078125, -203.35546875, -194.6328125, -185.91015625, -177.1875, -168.46484375, -159.7421875, -151.01953125, -142.296875, -133.57421875, -124.8515625, -116.12890625, -107.40625, -98.68359375, -89.9609375, -81.23828125, -72.515625, -63.79296875, -55.0703125, -46.34765625, -37.625, -28.90234375, -20.1796875, -11.45703125, -2.734375, 5.98828125, 14.7109375, 23.43359375, 32.15625, 40.87890625, 49.6015625, 58.32421875, 67.046875, 75.76953125, 84.4921875, 93.21484375, 101.9375, 110.66015625, 119.3828125, 128.10546875, 136.828125, 145.55078125, 154.2734375, 162.99609375, 171.71875, 180.44140625, 189.1640625, 197.88671875, 206.609375, 215.33203125, 224.0546875, 232.77734375, 241.5]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 4.0, 6.0, 5.0, 7.0, 21.0, 23.0, 23.0, 32.0, 46.0, 86.0, 148.0, 208.0, 390.0, 670.0, 1338.0, 2841.0, 6307.0, 15847.0, 48097.0, 190427.0, 602798.0, 123724.0, 33738.0, 11937.0, 4934.0, 2269.0, 1149.0, 611.0, 325.0, 201.0, 109.0, 79.0, 44.0, 30.0, 21.0, 15.0, 20.0, 8.0, 2.0, 2.0, 6.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.5625, -41.2470703125, -39.931640625, -38.6162109375, -37.30078125, -35.9853515625, -34.669921875, -33.3544921875, -32.0390625, -30.7236328125, -29.408203125, -28.0927734375, -26.77734375, -25.4619140625, -24.146484375, -22.8310546875, -21.515625, -20.2001953125, -18.884765625, -17.5693359375, -16.25390625, -14.9384765625, -13.623046875, -12.3076171875, -10.9921875, -9.6767578125, -8.361328125, -7.0458984375, -5.73046875, -4.4150390625, -3.099609375, -1.7841796875, -0.46875, 0.8466796875, 2.162109375, 3.4775390625, 4.79296875, 6.1083984375, 7.423828125, 8.7392578125, 10.0546875, 11.3701171875, 12.685546875, 14.0009765625, 15.31640625, 16.6318359375, 17.947265625, 19.2626953125, 20.578125, 21.8935546875, 23.208984375, 24.5244140625, 25.83984375, 27.1552734375, 28.470703125, 29.7861328125, 31.1015625, 32.4169921875, 33.732421875, 35.0478515625, 36.36328125, 37.6787109375, 38.994140625, 40.3095703125, 41.625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 2.0, 3.0, 6.0, 15.0, 12.0, 19.0, 20.0, 39.0, 38.0, 52.0, 89.0, 103.0, 115.0, 119.0, 80.0, 68.0, 53.0, 27.0, 25.0, 23.0, 21.0, 19.0, 11.0, 3.0, 4.0, 5.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.019073486328125, -0.018491744995117188, -0.017910003662109375, -0.017328262329101562, -0.01674652099609375, -0.016164779663085938, -0.015583038330078125, -0.015001296997070312, -0.0144195556640625, -0.013837814331054688, -0.013256072998046875, -0.012674331665039062, -0.01209259033203125, -0.011510848999023438, -0.010929107666015625, -0.010347366333007812, -0.009765625, -0.009183883666992188, -0.008602142333984375, -0.008020401000976562, -0.00743865966796875, -0.0068569183349609375, -0.006275177001953125, -0.0056934356689453125, -0.0051116943359375, -0.0045299530029296875, -0.003948211669921875, -0.0033664703369140625, -0.00278472900390625, -0.0022029876708984375, -0.001621246337890625, -0.0010395050048828125, -0.000457763671875, 0.0001239776611328125, 0.000705718994140625, 0.0012874603271484375, 0.00186920166015625, 0.0024509429931640625, 0.003032684326171875, 0.0036144256591796875, 0.0041961669921875, 0.0047779083251953125, 0.005359649658203125, 0.0059413909912109375, 0.00652313232421875, 0.0071048736572265625, 0.007686614990234375, 0.008268356323242188, 0.00885009765625, 0.009431838989257812, 0.010013580322265625, 0.010595321655273438, 0.01117706298828125, 0.011758804321289062, 0.012340545654296875, 0.012922286987304688, 0.0135040283203125, 0.014085769653320312, 0.014667510986328125, 0.015249252319335938, 0.01583099365234375, 0.016412734985351562, 0.016994476318359375, 0.017576217651367188, 0.018157958984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 12.0, 21.0, 28.0, 35.0, 80.0, 119.0, 174.0, 435.0, 965.0, 2586.0, 8236.0, 35498.0, 234592.0, 665371.0, 78117.0, 15261.0, 4100.0, 1520.0, 633.0, 316.0, 158.0, 82.0, 71.0, 48.0, 29.0, 14.0, 6.0, 5.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.3125, -62.376953125, -60.44140625, -58.505859375, -56.5703125, -54.634765625, -52.69921875, -50.763671875, -48.828125, -46.892578125, -44.95703125, -43.021484375, -41.0859375, -39.150390625, -37.21484375, -35.279296875, -33.34375, -31.408203125, -29.47265625, -27.537109375, -25.6015625, -23.666015625, -21.73046875, -19.794921875, -17.859375, -15.923828125, -13.98828125, -12.052734375, -10.1171875, -8.181640625, -6.24609375, -4.310546875, -2.375, -0.439453125, 1.49609375, 3.431640625, 5.3671875, 7.302734375, 9.23828125, 11.173828125, 13.109375, 15.044921875, 16.98046875, 18.916015625, 20.8515625, 22.787109375, 24.72265625, 26.658203125, 28.59375, 30.529296875, 32.46484375, 34.400390625, 36.3359375, 38.271484375, 40.20703125, 42.142578125, 44.078125, 46.013671875, 47.94921875, 49.884765625, 51.8203125, 53.755859375, 55.69140625, 57.626953125, 59.5625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 8.0, 15.0, 12.0, 19.0, 24.0, 30.0, 29.0, 30.0, 46.0, 65.0, 68.0, 69.0, 85.0, 88.0, 83.0, 67.0, 36.0, 46.0, 32.0, 30.0, 31.0, 20.0, 20.0, 2.0, 10.0, 8.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.90625, -50.1748046875, -48.443359375, -46.7119140625, -44.98046875, -43.2490234375, -41.517578125, -39.7861328125, -38.0546875, -36.3232421875, -34.591796875, -32.8603515625, -31.12890625, -29.3974609375, -27.666015625, -25.9345703125, -24.203125, -22.4716796875, -20.740234375, -19.0087890625, -17.27734375, -15.5458984375, -13.814453125, -12.0830078125, -10.3515625, -8.6201171875, -6.888671875, -5.1572265625, -3.42578125, -1.6943359375, 0.037109375, 1.7685546875, 3.5, 5.2314453125, 6.962890625, 8.6943359375, 10.42578125, 12.1572265625, 13.888671875, 15.6201171875, 17.3515625, 19.0830078125, 20.814453125, 22.5458984375, 24.27734375, 26.0087890625, 27.740234375, 29.4716796875, 31.203125, 32.9345703125, 34.666015625, 36.3974609375, 38.12890625, 39.8603515625, 41.591796875, 43.3232421875, 45.0546875, 46.7861328125, 48.517578125, 50.2490234375, 51.98046875, 53.7119140625, 55.443359375, 57.1748046875, 58.90625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 11.0, 23.0, 49.0, 74.0, 143.0, 303.0, 179.0, 100.0, 55.0, 27.0, 12.0, 7.0, 3.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1506.1136474609375, -1456.779296875, -1407.4449462890625, -1358.110595703125, -1308.7762451171875, -1259.44189453125, -1210.1075439453125, -1160.773193359375, -1111.4388427734375, -1062.1044921875, -1012.7701416015625, -963.435791015625, -914.1014404296875, -864.76708984375, -815.4327392578125, -766.098388671875, -716.7640991210938, -667.4297485351562, -618.0953979492188, -568.7610473632812, -519.4266967773438, -470.09234619140625, -420.7580261230469, -371.4236755371094, -322.0893249511719, -272.7549743652344, -223.42062377929688, -174.08628845214844, -124.75193786621094, -75.41758728027344, -26.083251953125, 23.2510986328125, 72.58544921875, 121.9197998046875, 171.254150390625, 220.58848571777344, 269.9228515625, 319.2572021484375, 368.5915222167969, 417.9258728027344, 467.2602233886719, 516.5945434570312, 565.9288940429688, 615.2632446289062, 664.5975952148438, 713.9319458007812, 763.2662963867188, 812.6006469726562, 861.9349975585938, 911.2693481445312, 960.6036987304688, 1009.9380493164062, 1059.2723388671875, 1108.606689453125, 1157.9410400390625, 1207.275390625, 1256.6097412109375, 1305.944091796875, 1355.2784423828125, 1404.61279296875, 1453.9471435546875, 1503.281494140625, 1552.6158447265625, 1601.9501953125, 1651.2845458984375]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 10.0, 17.0, 17.0, 18.0, 19.0, 27.0, 30.0, 18.0, 34.0, 36.0, 39.0, 58.0, 58.0, 74.0, 85.0, 71.0, 66.0, 29.0, 45.0, 35.0, 36.0, 23.0, 24.0, 14.0, 17.0, 19.0, 17.0, 13.0, 7.0, 9.0, 5.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-986.72607421875, -953.2200927734375, -919.7140502929688, -886.2080688476562, -852.7020263671875, -819.196044921875, -785.6900634765625, -752.18408203125, -718.6780395507812, -685.1720581054688, -651.666015625, -618.1600341796875, -584.654052734375, -551.1480102539062, -517.6420288085938, -484.1360168457031, -450.6300048828125, -417.1239929199219, -383.61798095703125, -350.11199951171875, -316.6059875488281, -283.0999755859375, -249.59397888183594, -216.08798217773438, -182.58197021484375, -149.07595825195312, -115.56996154785156, -82.06395721435547, -48.557952880859375, -15.05194091796875, 18.454055786132812, 51.960052490234375, 85.4661865234375, 118.9721908569336, 152.4781951904297, 185.98419189453125, 219.49020385742188, 252.9962158203125, 286.502197265625, 320.0082092285156, 353.51422119140625, 387.0202331542969, 420.5262451171875, 454.0322265625, 487.5382385253906, 521.0442504882812, 554.5502319335938, 588.0562744140625, 621.562255859375, 655.0682373046875, 688.5742797851562, 722.0802612304688, 755.5863037109375, 789.09228515625, 822.5982666015625, 856.104248046875, 889.6102905273438, 923.1162719726562, 956.622314453125, 990.1282958984375, 1023.63427734375, 1057.140380859375, 1090.6463623046875, 1124.15234375, 1157.6583251953125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 16.0, 29.0, 23.0, 51.0, 87.0, 162.0, 323.0, 730.0, 1927.0, 6747.0, 65608.0, 2749420.0, 1323550.0, 37699.0, 5205.0, 1557.0, 593.0, 253.0, 119.0, 79.0, 36.0, 16.0, 20.0, 6.0, 7.0, 8.0, 2.0, 0.0, 1.0], "bins": [-216.75, -212.1279296875, -207.505859375, -202.8837890625, -198.26171875, -193.6396484375, -189.017578125, -184.3955078125, -179.7734375, -175.1513671875, -170.529296875, -165.9072265625, -161.28515625, -156.6630859375, -152.041015625, -147.4189453125, -142.796875, -138.1748046875, -133.552734375, -128.9306640625, -124.30859375, -119.6865234375, -115.064453125, -110.4423828125, -105.8203125, -101.1982421875, -96.576171875, -91.9541015625, -87.33203125, -82.7099609375, -78.087890625, -73.4658203125, -68.84375, -64.2216796875, -59.599609375, -54.9775390625, -50.35546875, -45.7333984375, -41.111328125, -36.4892578125, -31.8671875, -27.2451171875, -22.623046875, -18.0009765625, -13.37890625, -8.7568359375, -4.134765625, 0.4873046875, 5.109375, 9.7314453125, 14.353515625, 18.9755859375, 23.59765625, 28.2197265625, 32.841796875, 37.4638671875, 42.0859375, 46.7080078125, 51.330078125, 55.9521484375, 60.57421875, 65.1962890625, 69.818359375, 74.4404296875, 79.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 10.0, 5.0, 9.0, 18.0, 8.0, 15.0, 11.0, 17.0, 23.0, 29.0, 35.0, 26.0, 27.0, 47.0, 32.0, 38.0, 38.0, 51.0, 50.0, 46.0, 56.0, 43.0, 33.0, 46.0, 36.0, 30.0, 40.0, 30.0, 24.0, 19.0, 22.0, 9.0, 12.0, 10.0, 8.0, 8.0, 9.0, 6.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-57.5625, -55.7939453125, -54.025390625, -52.2568359375, -50.48828125, -48.7197265625, -46.951171875, -45.1826171875, -43.4140625, -41.6455078125, -39.876953125, -38.1083984375, -36.33984375, -34.5712890625, -32.802734375, -31.0341796875, -29.265625, -27.4970703125, -25.728515625, -23.9599609375, -22.19140625, -20.4228515625, -18.654296875, -16.8857421875, -15.1171875, -13.3486328125, -11.580078125, -9.8115234375, -8.04296875, -6.2744140625, -4.505859375, -2.7373046875, -0.96875, 0.7998046875, 2.568359375, 4.3369140625, 6.10546875, 7.8740234375, 9.642578125, 11.4111328125, 13.1796875, 14.9482421875, 16.716796875, 18.4853515625, 20.25390625, 22.0224609375, 23.791015625, 25.5595703125, 27.328125, 29.0966796875, 30.865234375, 32.6337890625, 34.40234375, 36.1708984375, 37.939453125, 39.7080078125, 41.4765625, 43.2451171875, 45.013671875, 46.7822265625, 48.55078125, 50.3193359375, 52.087890625, 53.8564453125, 55.625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 13.0, 11.0, 24.0, 44.0, 106.0, 216.0, 409.0, 911.0, 2154.0, 8592.0, 98102.0, 3992768.0, 79555.0, 7809.0, 1944.0, 855.0, 395.0, 194.0, 70.0, 48.0, 25.0, 13.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-313.75, -304.6484375, -295.546875, -286.4453125, -277.34375, -268.2421875, -259.140625, -250.0390625, -240.9375, -231.8359375, -222.734375, -213.6328125, -204.53125, -195.4296875, -186.328125, -177.2265625, -168.125, -159.0234375, -149.921875, -140.8203125, -131.71875, -122.6171875, -113.515625, -104.4140625, -95.3125, -86.2109375, -77.109375, -68.0078125, -58.90625, -49.8046875, -40.703125, -31.6015625, -22.5, -13.3984375, -4.296875, 4.8046875, 13.90625, 23.0078125, 32.109375, 41.2109375, 50.3125, 59.4140625, 68.515625, 77.6171875, 86.71875, 95.8203125, 104.921875, 114.0234375, 123.125, 132.2265625, 141.328125, 150.4296875, 159.53125, 168.6328125, 177.734375, 186.8359375, 195.9375, 205.0390625, 214.140625, 223.2421875, 232.34375, 241.4453125, 250.546875, 259.6484375, 268.75]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 5.0, 12.0, 30.0, 25.0, 46.0, 102.0, 281.0, 816.0, 1483.0, 783.0, 254.0, 95.0, 46.0, 26.0, 25.0, 5.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.75, -252.732421875, -244.71484375, -236.697265625, -228.6796875, -220.662109375, -212.64453125, -204.626953125, -196.609375, -188.591796875, -180.57421875, -172.556640625, -164.5390625, -156.521484375, -148.50390625, -140.486328125, -132.46875, -124.451171875, -116.43359375, -108.416015625, -100.3984375, -92.380859375, -84.36328125, -76.345703125, -68.328125, -60.310546875, -52.29296875, -44.275390625, -36.2578125, -28.240234375, -20.22265625, -12.205078125, -4.1875, 3.830078125, 11.84765625, 19.865234375, 27.8828125, 35.900390625, 43.91796875, 51.935546875, 59.953125, 67.970703125, 75.98828125, 84.005859375, 92.0234375, 100.041015625, 108.05859375, 116.076171875, 124.09375, 132.111328125, 140.12890625, 148.146484375, 156.1640625, 164.181640625, 172.19921875, 180.216796875, 188.234375, 196.251953125, 204.26953125, 212.287109375, 220.3046875, 228.322265625, 236.33984375, 244.357421875, 252.375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 13.0, 21.0, 92.0, 282.0, 387.0, 140.0, 40.0, 16.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4348.564453125, -4254.642578125, -4160.72021484375, -4066.79833984375, -3972.876220703125, -3878.9541015625, -3785.031982421875, -3691.10986328125, -3597.187744140625, -3503.265625, -3409.343505859375, -3315.42138671875, -3221.49951171875, -3127.577392578125, -3033.6552734375, -2939.733154296875, -2845.81103515625, -2751.888916015625, -2657.966796875, -2564.044921875, -2470.122802734375, -2376.20068359375, -2282.278564453125, -2188.3564453125, -2094.4345703125, -2000.512451171875, -1906.5904541015625, -1812.6683349609375, -1718.7462158203125, -1624.82421875, -1530.902099609375, -1436.97998046875, -1343.0577392578125, -1249.1356201171875, -1155.213623046875, -1061.29150390625, -967.369384765625, -873.4473266601562, -779.5252685546875, -685.6031494140625, -591.6810913085938, -497.7590026855469, -403.8369140625, -309.91485595703125, -215.99276733398438, -122.0706787109375, -28.14862060546875, 65.77349853515625, 159.695556640625, 253.61764526367188, 347.53973388671875, 441.4617919921875, 535.3839111328125, 629.3059692382812, 723.22802734375, 817.150146484375, 911.0722045898438, 1004.9942626953125, 1098.9163818359375, 1192.83837890625, 1286.760498046875, 1380.6826171875, 1474.604736328125, 1568.52685546875, 1662.4488525390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 6.0, 6.0, 9.0, 9.0, 11.0, 21.0, 12.0, 12.0, 32.0, 23.0, 34.0, 44.0, 30.0, 33.0, 39.0, 25.0, 48.0, 36.0, 45.0, 43.0, 27.0, 42.0, 42.0, 45.0, 41.0, 32.0, 44.0, 31.0, 30.0, 30.0, 21.0, 15.0, 18.0, 14.0, 8.0, 5.0, 6.0, 6.0, 5.0, 5.0, 4.0, 6.0, 1.0, 2.0, 3.0, 3.0], "bins": [-732.2766723632812, -712.4835815429688, -692.6904907226562, -672.8973999023438, -653.1043090820312, -633.3112182617188, -613.5181274414062, -593.7250366210938, -573.9319458007812, -554.1388549804688, -534.3457641601562, -514.5526733398438, -494.75958251953125, -474.96649169921875, -455.17340087890625, -435.38031005859375, -415.58721923828125, -395.79412841796875, -376.00103759765625, -356.20794677734375, -336.41485595703125, -316.62176513671875, -296.82867431640625, -277.03558349609375, -257.24249267578125, -237.44940185546875, -217.65631103515625, -197.86322021484375, -178.07012939453125, -158.27703857421875, -138.48394775390625, -118.69085693359375, -98.8978271484375, -79.104736328125, -59.3116455078125, -39.5185546875, -19.7254638671875, 0.067626953125, 19.8607177734375, 39.65380859375, 59.4468994140625, 79.239990234375, 99.0330810546875, 118.826171875, 138.6192626953125, 158.412353515625, 178.2054443359375, 197.99853515625, 217.7916259765625, 237.584716796875, 257.3778076171875, 277.1708984375, 296.9639892578125, 316.757080078125, 336.5501708984375, 356.34326171875, 376.1363525390625, 395.929443359375, 415.7225341796875, 435.515625, 455.3087158203125, 475.101806640625, 494.8948974609375, 514.68798828125, 534.4810791015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 9.0, 11.0, 26.0, 28.0, 32.0, 69.0, 96.0, 133.0, 165.0, 337.0, 448.0, 787.0, 1375.0, 2443.0, 4550.0, 8867.0, 18547.0, 41183.0, 99288.0, 261580.0, 353640.0, 146523.0, 58069.0, 25159.0, 11735.0, 6061.0, 3104.0, 1728.0, 951.0, 571.0, 353.0, 224.0, 142.0, 96.0, 59.0, 51.0, 27.0, 18.0, 16.0, 13.0, 3.0, 6.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-95.5625, -92.84765625, -90.1328125, -87.41796875, -84.703125, -81.98828125, -79.2734375, -76.55859375, -73.84375, -71.12890625, -68.4140625, -65.69921875, -62.984375, -60.26953125, -57.5546875, -54.83984375, -52.125, -49.41015625, -46.6953125, -43.98046875, -41.265625, -38.55078125, -35.8359375, -33.12109375, -30.40625, -27.69140625, -24.9765625, -22.26171875, -19.546875, -16.83203125, -14.1171875, -11.40234375, -8.6875, -5.97265625, -3.2578125, -0.54296875, 2.171875, 4.88671875, 7.6015625, 10.31640625, 13.03125, 15.74609375, 18.4609375, 21.17578125, 23.890625, 26.60546875, 29.3203125, 32.03515625, 34.75, 37.46484375, 40.1796875, 42.89453125, 45.609375, 48.32421875, 51.0390625, 53.75390625, 56.46875, 59.18359375, 61.8984375, 64.61328125, 67.328125, 70.04296875, 72.7578125, 75.47265625, 78.1875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 5.0, 6.0, 7.0, 7.0, 11.0, 10.0, 13.0, 20.0, 11.0, 12.0, 30.0, 23.0, 32.0, 46.0, 38.0, 51.0, 46.0, 44.0, 49.0, 54.0, 65.0, 61.0, 42.0, 32.0, 46.0, 43.0, 46.0, 22.0, 29.0, 19.0, 18.0, 15.0, 9.0, 6.0, 5.0, 9.0, 4.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.5, -67.3359375, -65.171875, -63.0078125, -60.84375, -58.6796875, -56.515625, -54.3515625, -52.1875, -50.0234375, -47.859375, -45.6953125, -43.53125, -41.3671875, -39.203125, -37.0390625, -34.875, -32.7109375, -30.546875, -28.3828125, -26.21875, -24.0546875, -21.890625, -19.7265625, -17.5625, -15.3984375, -13.234375, -11.0703125, -8.90625, -6.7421875, -4.578125, -2.4140625, -0.25, 1.9140625, 4.078125, 6.2421875, 8.40625, 10.5703125, 12.734375, 14.8984375, 17.0625, 19.2265625, 21.390625, 23.5546875, 25.71875, 27.8828125, 30.046875, 32.2109375, 34.375, 36.5390625, 38.703125, 40.8671875, 43.03125, 45.1953125, 47.359375, 49.5234375, 51.6875, 53.8515625, 56.015625, 58.1796875, 60.34375, 62.5078125, 64.671875, 66.8359375, 69.0]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 10.0, 10.0, 9.0, 17.0, 35.0, 37.0, 75.0, 120.0, 187.0, 329.0, 646.0, 1541.0, 5309.0, 36634.0, 772970.0, 209667.0, 15502.0, 3126.0, 1132.0, 542.0, 241.0, 138.0, 81.0, 65.0, 34.0, 28.0, 16.0, 15.0, 12.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.5, -279.4296875, -270.359375, -261.2890625, -252.21875, -243.1484375, -234.078125, -225.0078125, -215.9375, -206.8671875, -197.796875, -188.7265625, -179.65625, -170.5859375, -161.515625, -152.4453125, -143.375, -134.3046875, -125.234375, -116.1640625, -107.09375, -98.0234375, -88.953125, -79.8828125, -70.8125, -61.7421875, -52.671875, -43.6015625, -34.53125, -25.4609375, -16.390625, -7.3203125, 1.75, 10.8203125, 19.890625, 28.9609375, 38.03125, 47.1015625, 56.171875, 65.2421875, 74.3125, 83.3828125, 92.453125, 101.5234375, 110.59375, 119.6640625, 128.734375, 137.8046875, 146.875, 155.9453125, 165.015625, 174.0859375, 183.15625, 192.2265625, 201.296875, 210.3671875, 219.4375, 228.5078125, 237.578125, 246.6484375, 255.71875, 264.7890625, 273.859375, 282.9296875, 292.0]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 6.0, 1.0, 5.0, 5.0, 12.0, 8.0, 11.0, 14.0, 13.0, 15.0, 20.0, 28.0, 25.0, 33.0, 41.0, 41.0, 44.0, 53.0, 57.0, 60.0, 56.0, 60.0, 55.0, 41.0, 47.0, 49.0, 26.0, 34.0, 26.0, 30.0, 19.0, 18.0, 12.0, 8.0, 11.0, 3.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.125, -220.884765625, -212.64453125, -204.404296875, -196.1640625, -187.923828125, -179.68359375, -171.443359375, -163.203125, -154.962890625, -146.72265625, -138.482421875, -130.2421875, -122.001953125, -113.76171875, -105.521484375, -97.28125, -89.041015625, -80.80078125, -72.560546875, -64.3203125, -56.080078125, -47.83984375, -39.599609375, -31.359375, -23.119140625, -14.87890625, -6.638671875, 1.6015625, 9.841796875, 18.08203125, 26.322265625, 34.5625, 42.802734375, 51.04296875, 59.283203125, 67.5234375, 75.763671875, 84.00390625, 92.244140625, 100.484375, 108.724609375, 116.96484375, 125.205078125, 133.4453125, 141.685546875, 149.92578125, 158.166015625, 166.40625, 174.646484375, 182.88671875, 191.126953125, 199.3671875, 207.607421875, 215.84765625, 224.087890625, 232.328125, 240.568359375, 248.80859375, 257.048828125, 265.2890625, 273.529296875, 281.76953125, 290.009765625, 298.25]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 10.0, 6.0, 10.0, 10.0, 17.0, 35.0, 31.0, 60.0, 94.0, 157.0, 261.0, 412.0, 782.0, 1664.0, 4336.0, 14555.0, 73803.0, 782409.0, 137546.0, 22028.0, 5926.0, 2171.0, 968.0, 504.0, 272.0, 180.0, 104.0, 60.0, 54.0, 23.0, 24.0, 13.0, 10.0, 11.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.4375, -64.26953125, -62.1015625, -59.93359375, -57.765625, -55.59765625, -53.4296875, -51.26171875, -49.09375, -46.92578125, -44.7578125, -42.58984375, -40.421875, -38.25390625, -36.0859375, -33.91796875, -31.75, -29.58203125, -27.4140625, -25.24609375, -23.078125, -20.91015625, -18.7421875, -16.57421875, -14.40625, -12.23828125, -10.0703125, -7.90234375, -5.734375, -3.56640625, -1.3984375, 0.76953125, 2.9375, 5.10546875, 7.2734375, 9.44140625, 11.609375, 13.77734375, 15.9453125, 18.11328125, 20.28125, 22.44921875, 24.6171875, 26.78515625, 28.953125, 31.12109375, 33.2890625, 35.45703125, 37.625, 39.79296875, 41.9609375, 44.12890625, 46.296875, 48.46484375, 50.6328125, 52.80078125, 54.96875, 57.13671875, 59.3046875, 61.47265625, 63.640625, 65.80859375, 67.9765625, 70.14453125, 72.3125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 9.0, 22.0, 25.0, 55.0, 131.0, 370.0, 211.0, 81.0, 43.0, 22.0, 13.0, 5.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0709228515625, -0.06913566589355469, -0.06734848022460938, -0.06556129455566406, -0.06377410888671875, -0.06198692321777344, -0.060199737548828125, -0.05841255187988281, -0.0566253662109375, -0.05483818054199219, -0.053050994873046875, -0.05126380920410156, -0.04947662353515625, -0.04768943786621094, -0.045902252197265625, -0.04411506652832031, -0.042327880859375, -0.04054069519042969, -0.038753509521484375, -0.03696632385253906, -0.03517913818359375, -0.03339195251464844, -0.031604766845703125, -0.029817581176757812, -0.0280303955078125, -0.026243209838867188, -0.024456024169921875, -0.022668838500976562, -0.02088165283203125, -0.019094467163085938, -0.017307281494140625, -0.015520095825195312, -0.01373291015625, -0.011945724487304688, -0.010158538818359375, -0.008371353149414062, -0.00658416748046875, -0.0047969818115234375, -0.003009796142578125, -0.0012226104736328125, 0.0005645751953125, 0.0023517608642578125, 0.004138946533203125, 0.0059261322021484375, 0.00771331787109375, 0.009500503540039062, 0.011287689208984375, 0.013074874877929688, 0.014862060546875, 0.016649246215820312, 0.018436431884765625, 0.020223617553710938, 0.02201080322265625, 0.023797988891601562, 0.025585174560546875, 0.027372360229492188, 0.0291595458984375, 0.030946731567382812, 0.032733917236328125, 0.03452110290527344, 0.03630828857421875, 0.03809547424316406, 0.039882659912109375, 0.04166984558105469, 0.04345703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 11.0, 8.0, 17.0, 27.0, 32.0, 56.0, 76.0, 127.0, 210.0, 388.0, 698.0, 1509.0, 3690.0, 11152.0, 49856.0, 702561.0, 235512.0, 29704.0, 7594.0, 2743.0, 1162.0, 569.0, 341.0, 165.0, 109.0, 68.0, 43.0, 38.0, 21.0, 18.0, 10.0, 6.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-66.875, -64.70703125, -62.5390625, -60.37109375, -58.203125, -56.03515625, -53.8671875, -51.69921875, -49.53125, -47.36328125, -45.1953125, -43.02734375, -40.859375, -38.69140625, -36.5234375, -34.35546875, -32.1875, -30.01953125, -27.8515625, -25.68359375, -23.515625, -21.34765625, -19.1796875, -17.01171875, -14.84375, -12.67578125, -10.5078125, -8.33984375, -6.171875, -4.00390625, -1.8359375, 0.33203125, 2.5, 4.66796875, 6.8359375, 9.00390625, 11.171875, 13.33984375, 15.5078125, 17.67578125, 19.84375, 22.01171875, 24.1796875, 26.34765625, 28.515625, 30.68359375, 32.8515625, 35.01953125, 37.1875, 39.35546875, 41.5234375, 43.69140625, 45.859375, 48.02734375, 50.1953125, 52.36328125, 54.53125, 56.69921875, 58.8671875, 61.03515625, 63.203125, 65.37109375, 67.5390625, 69.70703125, 71.875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 5.0, 6.0, 12.0, 18.0, 22.0, 31.0, 34.0, 47.0, 65.0, 86.0, 139.0, 145.0, 96.0, 92.0, 39.0, 36.0, 33.0, 15.0, 14.0, 11.0, 10.0, 4.0, 8.0, 10.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.25, -68.0771484375, -65.904296875, -63.7314453125, -61.55859375, -59.3857421875, -57.212890625, -55.0400390625, -52.8671875, -50.6943359375, -48.521484375, -46.3486328125, -44.17578125, -42.0029296875, -39.830078125, -37.6572265625, -35.484375, -33.3115234375, -31.138671875, -28.9658203125, -26.79296875, -24.6201171875, -22.447265625, -20.2744140625, -18.1015625, -15.9287109375, -13.755859375, -11.5830078125, -9.41015625, -7.2373046875, -5.064453125, -2.8916015625, -0.71875, 1.4541015625, 3.626953125, 5.7998046875, 7.97265625, 10.1455078125, 12.318359375, 14.4912109375, 16.6640625, 18.8369140625, 21.009765625, 23.1826171875, 25.35546875, 27.5283203125, 29.701171875, 31.8740234375, 34.046875, 36.2197265625, 38.392578125, 40.5654296875, 42.73828125, 44.9111328125, 47.083984375, 49.2568359375, 51.4296875, 53.6025390625, 55.775390625, 57.9482421875, 60.12109375, 62.2939453125, 64.466796875, 66.6396484375, 68.8125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 9.0, 15.0, 30.0, 54.0, 135.0, 406.0, 170.0, 100.0, 40.0, 20.0, 13.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1918.5721435546875, -1855.9722900390625, -1793.3724365234375, -1730.772705078125, -1668.1728515625, -1605.572998046875, -1542.97314453125, -1480.373291015625, -1417.7734375, -1355.173583984375, -1292.57373046875, -1229.973876953125, -1167.3741455078125, -1104.7742919921875, -1042.1744384765625, -979.5745849609375, -916.974853515625, -854.375, -791.7752075195312, -729.1753540039062, -666.5755615234375, -603.9757080078125, -541.3758544921875, -478.7760314941406, -416.17620849609375, -353.5763854980469, -290.9765625, -228.376708984375, -165.77688598632812, -103.17706298828125, -40.57720947265625, 22.022613525390625, 84.62255859375, 147.22238159179688, 209.8222198486328, 272.42205810546875, 335.0218811035156, 397.6217041015625, 460.2215576171875, 522.8214111328125, 585.4212036132812, 648.0210571289062, 710.620849609375, 773.220703125, 835.820556640625, 898.4203491210938, 961.0202026367188, 1023.6199951171875, 1086.2198486328125, 1148.8197021484375, 1211.4195556640625, 1274.019287109375, 1336.619140625, 1399.218994140625, 1461.81884765625, 1524.418701171875, 1587.0185546875, 1649.618408203125, 1712.21826171875, 1774.818115234375, 1837.4178466796875, 1900.0177001953125, 1962.6175537109375, 2025.2174072265625, 2087.817138671875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 7.0, 11.0, 6.0, 12.0, 15.0, 13.0, 26.0, 20.0, 26.0, 27.0, 33.0, 30.0, 43.0, 47.0, 86.0, 93.0, 95.0, 66.0, 55.0, 36.0, 38.0, 28.0, 26.0, 19.0, 21.0, 12.0, 13.0, 13.0, 12.0, 9.0, 9.0, 5.0, 7.0, 5.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-868.7910766601562, -840.6497192382812, -812.5083618164062, -784.3670043945312, -756.2256469726562, -728.084228515625, -699.94287109375, -671.801513671875, -643.66015625, -615.518798828125, -587.37744140625, -559.236083984375, -531.0947265625, -502.9533386230469, -474.8119812011719, -446.67059326171875, -418.5292663574219, -390.3879089355469, -362.2465515136719, -334.10516357421875, -305.96380615234375, -277.82244873046875, -249.68109130859375, -221.5397186279297, -193.3983612060547, -165.2570037841797, -137.11563110351562, -108.97427368164062, -80.8329086303711, -52.69154357910156, -24.550186157226562, 3.5911865234375, 31.7325439453125, 59.87390899658203, 88.01527404785156, 116.15663146972656, 144.29800415039062, 172.43936157226562, 200.58071899414062, 228.7220916748047, 256.86346435546875, 285.00482177734375, 313.14617919921875, 341.28753662109375, 369.4289245605469, 397.5702819824219, 425.7116394042969, 453.85302734375, 481.9943542480469, 510.1357116699219, 538.277099609375, 566.41845703125, 594.559814453125, 622.701171875, 650.842529296875, 678.98388671875, 707.125244140625, 735.2666015625, 763.407958984375, 791.54931640625, 819.690673828125, 847.83203125, 875.973388671875, 904.1148071289062, 932.2561645507812]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 11.0, 6.0, 18.0, 9.0, 11.0, 7.0, 9.0, 17.0, 30.0, 35.0, 38.0, 33.0, 52.0, 78.0, 144.0, 240.0, 473.0, 1058.0, 2870.0, 13088.0, 192269.0, 3493202.0, 461914.0, 22195.0, 3903.0, 1230.0, 520.0, 261.0, 153.0, 97.0, 63.0, 58.0, 58.0, 30.0, 20.0, 24.0, 15.0, 12.0, 12.0, 8.0, 9.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-189.75, -184.705078125, -179.66015625, -174.615234375, -169.5703125, -164.525390625, -159.48046875, -154.435546875, -149.390625, -144.345703125, -139.30078125, -134.255859375, -129.2109375, -124.166015625, -119.12109375, -114.076171875, -109.03125, -103.986328125, -98.94140625, -93.896484375, -88.8515625, -83.806640625, -78.76171875, -73.716796875, -68.671875, -63.626953125, -58.58203125, -53.537109375, -48.4921875, -43.447265625, -38.40234375, -33.357421875, -28.3125, -23.267578125, -18.22265625, -13.177734375, -8.1328125, -3.087890625, 1.95703125, 7.001953125, 12.046875, 17.091796875, 22.13671875, 27.181640625, 32.2265625, 37.271484375, 42.31640625, 47.361328125, 52.40625, 57.451171875, 62.49609375, 67.541015625, 72.5859375, 77.630859375, 82.67578125, 87.720703125, 92.765625, 97.810546875, 102.85546875, 107.900390625, 112.9453125, 117.990234375, 123.03515625, 128.080078125, 133.125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 8.0, 6.0, 9.0, 15.0, 18.0, 14.0, 22.0, 21.0, 30.0, 40.0, 36.0, 44.0, 42.0, 47.0, 56.0, 56.0, 66.0, 57.0, 53.0, 47.0, 33.0, 48.0, 42.0, 42.0, 28.0, 19.0, 14.0, 23.0, 15.0, 13.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.6875, -67.51953125, -65.3515625, -63.18359375, -61.015625, -58.84765625, -56.6796875, -54.51171875, -52.34375, -50.17578125, -48.0078125, -45.83984375, -43.671875, -41.50390625, -39.3359375, -37.16796875, -35.0, -32.83203125, -30.6640625, -28.49609375, -26.328125, -24.16015625, -21.9921875, -19.82421875, -17.65625, -15.48828125, -13.3203125, -11.15234375, -8.984375, -6.81640625, -4.6484375, -2.48046875, -0.3125, 1.85546875, 4.0234375, 6.19140625, 8.359375, 10.52734375, 12.6953125, 14.86328125, 17.03125, 19.19921875, 21.3671875, 23.53515625, 25.703125, 27.87109375, 30.0390625, 32.20703125, 34.375, 36.54296875, 38.7109375, 40.87890625, 43.046875, 45.21484375, 47.3828125, 49.55078125, 51.71875, 53.88671875, 56.0546875, 58.22265625, 60.390625, 62.55859375, 64.7265625, 66.89453125, 69.0625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 11.0, 13.0, 18.0, 26.0, 42.0, 73.0, 137.0, 257.0, 669.0, 1966.0, 9693.0, 137745.0, 3983115.0, 52064.0, 6027.0, 1447.0, 500.0, 216.0, 88.0, 83.0, 33.0, 23.0, 18.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-411.5, -401.046875, -390.59375, -380.140625, -369.6875, -359.234375, -348.78125, -338.328125, -327.875, -317.421875, -306.96875, -296.515625, -286.0625, -275.609375, -265.15625, -254.703125, -244.25, -233.796875, -223.34375, -212.890625, -202.4375, -191.984375, -181.53125, -171.078125, -160.625, -150.171875, -139.71875, -129.265625, -118.8125, -108.359375, -97.90625, -87.453125, -77.0, -66.546875, -56.09375, -45.640625, -35.1875, -24.734375, -14.28125, -3.828125, 6.625, 17.078125, 27.53125, 37.984375, 48.4375, 58.890625, 69.34375, 79.796875, 90.25, 100.703125, 111.15625, 121.609375, 132.0625, 142.515625, 152.96875, 163.421875, 173.875, 184.328125, 194.78125, 205.234375, 215.6875, 226.140625, 236.59375, 247.046875, 257.5]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 7.0, 8.0, 9.0, 22.0, 17.0, 33.0, 66.0, 174.0, 503.0, 1237.0, 1200.0, 421.0, 171.0, 68.0, 51.0, 23.0, 24.0, 13.0, 5.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-333.75, -324.728515625, -315.70703125, -306.685546875, -297.6640625, -288.642578125, -279.62109375, -270.599609375, -261.578125, -252.556640625, -243.53515625, -234.513671875, -225.4921875, -216.470703125, -207.44921875, -198.427734375, -189.40625, -180.384765625, -171.36328125, -162.341796875, -153.3203125, -144.298828125, -135.27734375, -126.255859375, -117.234375, -108.212890625, -99.19140625, -90.169921875, -81.1484375, -72.126953125, -63.10546875, -54.083984375, -45.0625, -36.041015625, -27.01953125, -17.998046875, -8.9765625, 0.044921875, 9.06640625, 18.087890625, 27.109375, 36.130859375, 45.15234375, 54.173828125, 63.1953125, 72.216796875, 81.23828125, 90.259765625, 99.28125, 108.302734375, 117.32421875, 126.345703125, 135.3671875, 144.388671875, 153.41015625, 162.431640625, 171.453125, 180.474609375, 189.49609375, 198.517578125, 207.5390625, 216.560546875, 225.58203125, 234.603515625, 243.625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 8.0, 20.0, 29.0, 51.0, 91.0, 196.0, 276.0, 185.0, 73.0, 33.0, 17.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2721.724365234375, -2659.12890625, -2596.53369140625, -2533.9384765625, -2471.343017578125, -2408.74755859375, -2346.15234375, -2283.55712890625, -2220.961669921875, -2158.3662109375, -2095.77099609375, -2033.1756591796875, -1970.580322265625, -1907.9849853515625, -1845.3896484375, -1782.7943115234375, -1720.198974609375, -1657.6036376953125, -1595.00830078125, -1532.4129638671875, -1469.817626953125, -1407.2222900390625, -1344.626953125, -1282.0316162109375, -1219.436279296875, -1156.8409423828125, -1094.24560546875, -1031.6502685546875, -969.054931640625, -906.4595947265625, -843.8642578125, -781.2689208984375, -718.6737060546875, -656.078369140625, -593.4830322265625, -530.8876953125, -468.2923583984375, -405.697021484375, -343.1016845703125, -280.50634765625, -217.9110107421875, -155.315673828125, -92.7203369140625, -30.125, 32.4703369140625, 95.065673828125, 157.6610107421875, 220.25634765625, 282.8516845703125, 345.447021484375, 408.0423583984375, 470.6376953125, 533.2330322265625, 595.828369140625, 658.4237060546875, 721.01904296875, 783.6143798828125, 846.209716796875, 908.8050537109375, 971.400390625, 1033.9957275390625, 1096.591064453125, 1159.1864013671875, 1221.78173828125, 1284.3770751953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 7.0, 6.0, 7.0, 17.0, 16.0, 18.0, 16.0, 24.0, 26.0, 32.0, 30.0, 41.0, 35.0, 50.0, 58.0, 37.0, 63.0, 61.0, 66.0, 53.0, 48.0, 36.0, 36.0, 32.0, 35.0, 26.0, 25.0, 27.0, 15.0, 20.0, 11.0, 7.0, 7.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-964.9420166015625, -938.08447265625, -911.2269287109375, -884.3693237304688, -857.5117797851562, -830.6542358398438, -803.7966918945312, -776.9390869140625, -750.08154296875, -723.2239990234375, -696.366455078125, -669.5088500976562, -642.6513061523438, -615.7937622070312, -588.9362182617188, -562.07861328125, -535.2210693359375, -508.363525390625, -481.5059509277344, -454.6484069824219, -427.79083251953125, -400.93328857421875, -374.07574462890625, -347.2181701660156, -320.36065673828125, -293.50311279296875, -266.6455383300781, -239.78799438476562, -212.930419921875, -186.0728759765625, -159.21531677246094, -132.35775756835938, -105.50018310546875, -78.64262390136719, -51.78506851196289, -24.927513122558594, 1.9300460815429688, 28.78759765625, 55.64515686035156, 82.50271606445312, 109.36027526855469, 136.21783447265625, 163.0753936767578, 189.93295288085938, 216.79049682617188, 243.64805603027344, 270.505615234375, 297.3631591796875, 324.2207336425781, 351.0782775878906, 377.93585205078125, 404.79339599609375, 431.6509704589844, 458.5085144042969, 485.3660888671875, 512.2236328125, 539.0811767578125, 565.938720703125, 592.7962646484375, 619.6538696289062, 646.5114135742188, 673.3689575195312, 700.2265014648438, 727.0841064453125, 753.941650390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 11.0, 15.0, 18.0, 27.0, 33.0, 53.0, 69.0, 113.0, 120.0, 194.0, 307.0, 441.0, 713.0, 1125.0, 1678.0, 2789.0, 4809.0, 8674.0, 16713.0, 35223.0, 80969.0, 217450.0, 387829.0, 164331.0, 63900.0, 28732.0, 14040.0, 7402.0, 4099.0, 2356.0, 1510.0, 959.0, 594.0, 379.0, 254.0, 202.0, 134.0, 85.0, 56.0, 37.0, 24.0, 23.0, 18.0, 10.0, 10.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 4.0], "bins": [-103.9375, -100.822265625, -97.70703125, -94.591796875, -91.4765625, -88.361328125, -85.24609375, -82.130859375, -79.015625, -75.900390625, -72.78515625, -69.669921875, -66.5546875, -63.439453125, -60.32421875, -57.208984375, -54.09375, -50.978515625, -47.86328125, -44.748046875, -41.6328125, -38.517578125, -35.40234375, -32.287109375, -29.171875, -26.056640625, -22.94140625, -19.826171875, -16.7109375, -13.595703125, -10.48046875, -7.365234375, -4.25, -1.134765625, 1.98046875, 5.095703125, 8.2109375, 11.326171875, 14.44140625, 17.556640625, 20.671875, 23.787109375, 26.90234375, 30.017578125, 33.1328125, 36.248046875, 39.36328125, 42.478515625, 45.59375, 48.708984375, 51.82421875, 54.939453125, 58.0546875, 61.169921875, 64.28515625, 67.400390625, 70.515625, 73.630859375, 76.74609375, 79.861328125, 82.9765625, 86.091796875, 89.20703125, 92.322265625, 95.4375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 4.0, 8.0, 9.0, 9.0, 21.0, 15.0, 21.0, 29.0, 22.0, 30.0, 42.0, 42.0, 49.0, 47.0, 49.0, 54.0, 54.0, 64.0, 63.0, 56.0, 38.0, 51.0, 54.0, 34.0, 22.0, 18.0, 16.0, 9.0, 19.0, 11.0, 14.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.5625, -75.1650390625, -72.767578125, -70.3701171875, -67.97265625, -65.5751953125, -63.177734375, -60.7802734375, -58.3828125, -55.9853515625, -53.587890625, -51.1904296875, -48.79296875, -46.3955078125, -43.998046875, -41.6005859375, -39.203125, -36.8056640625, -34.408203125, -32.0107421875, -29.61328125, -27.2158203125, -24.818359375, -22.4208984375, -20.0234375, -17.6259765625, -15.228515625, -12.8310546875, -10.43359375, -8.0361328125, -5.638671875, -3.2412109375, -0.84375, 1.5537109375, 3.951171875, 6.3486328125, 8.74609375, 11.1435546875, 13.541015625, 15.9384765625, 18.3359375, 20.7333984375, 23.130859375, 25.5283203125, 27.92578125, 30.3232421875, 32.720703125, 35.1181640625, 37.515625, 39.9130859375, 42.310546875, 44.7080078125, 47.10546875, 49.5029296875, 51.900390625, 54.2978515625, 56.6953125, 59.0927734375, 61.490234375, 63.8876953125, 66.28515625, 68.6826171875, 71.080078125, 73.4775390625, 75.875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 16.0, 9.0, 17.0, 30.0, 30.0, 35.0, 59.0, 85.0, 120.0, 213.0, 294.0, 517.0, 945.0, 2413.0, 8884.0, 65193.0, 861234.0, 91366.0, 11394.0, 2871.0, 1159.0, 602.0, 363.0, 221.0, 150.0, 99.0, 60.0, 48.0, 38.0, 16.0, 16.0, 12.0, 5.0, 13.0, 5.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-294.75, -286.22265625, -277.6953125, -269.16796875, -260.640625, -252.11328125, -243.5859375, -235.05859375, -226.53125, -218.00390625, -209.4765625, -200.94921875, -192.421875, -183.89453125, -175.3671875, -166.83984375, -158.3125, -149.78515625, -141.2578125, -132.73046875, -124.203125, -115.67578125, -107.1484375, -98.62109375, -90.09375, -81.56640625, -73.0390625, -64.51171875, -55.984375, -47.45703125, -38.9296875, -30.40234375, -21.875, -13.34765625, -4.8203125, 3.70703125, 12.234375, 20.76171875, 29.2890625, 37.81640625, 46.34375, 54.87109375, 63.3984375, 71.92578125, 80.453125, 88.98046875, 97.5078125, 106.03515625, 114.5625, 123.08984375, 131.6171875, 140.14453125, 148.671875, 157.19921875, 165.7265625, 174.25390625, 182.78125, 191.30859375, 199.8359375, 208.36328125, 216.890625, 225.41796875, 233.9453125, 242.47265625, 251.0]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 4.0, 9.0, 13.0, 25.0, 18.0, 23.0, 30.0, 50.0, 43.0, 87.0, 78.0, 63.0, 82.0, 75.0, 82.0, 67.0, 47.0, 39.0, 35.0, 38.0, 23.0, 15.0, 17.0, 8.0, 8.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-439.75, -428.2421875, -416.734375, -405.2265625, -393.71875, -382.2109375, -370.703125, -359.1953125, -347.6875, -336.1796875, -324.671875, -313.1640625, -301.65625, -290.1484375, -278.640625, -267.1328125, -255.625, -244.1171875, -232.609375, -221.1015625, -209.59375, -198.0859375, -186.578125, -175.0703125, -163.5625, -152.0546875, -140.546875, -129.0390625, -117.53125, -106.0234375, -94.515625, -83.0078125, -71.5, -59.9921875, -48.484375, -36.9765625, -25.46875, -13.9609375, -2.453125, 9.0546875, 20.5625, 32.0703125, 43.578125, 55.0859375, 66.59375, 78.1015625, 89.609375, 101.1171875, 112.625, 124.1328125, 135.640625, 147.1484375, 158.65625, 170.1640625, 181.671875, 193.1796875, 204.6875, 216.1953125, 227.703125, 239.2109375, 250.71875, 262.2265625, 273.734375, 285.2421875, 296.75]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 11.0, 17.0, 20.0, 20.0, 38.0, 39.0, 66.0, 86.0, 140.0, 251.0, 491.0, 1228.0, 3550.0, 17237.0, 172997.0, 797199.0, 44558.0, 6988.0, 1974.0, 708.0, 363.0, 191.0, 125.0, 78.0, 42.0, 27.0, 21.0, 19.0, 15.0, 6.0, 8.0, 7.0, 4.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-58.46875, -56.5966796875, -54.724609375, -52.8525390625, -50.98046875, -49.1083984375, -47.236328125, -45.3642578125, -43.4921875, -41.6201171875, -39.748046875, -37.8759765625, -36.00390625, -34.1318359375, -32.259765625, -30.3876953125, -28.515625, -26.6435546875, -24.771484375, -22.8994140625, -21.02734375, -19.1552734375, -17.283203125, -15.4111328125, -13.5390625, -11.6669921875, -9.794921875, -7.9228515625, -6.05078125, -4.1787109375, -2.306640625, -0.4345703125, 1.4375, 3.3095703125, 5.181640625, 7.0537109375, 8.92578125, 10.7978515625, 12.669921875, 14.5419921875, 16.4140625, 18.2861328125, 20.158203125, 22.0302734375, 23.90234375, 25.7744140625, 27.646484375, 29.5185546875, 31.390625, 33.2626953125, 35.134765625, 37.0068359375, 38.87890625, 40.7509765625, 42.623046875, 44.4951171875, 46.3671875, 48.2392578125, 50.111328125, 51.9833984375, 53.85546875, 55.7275390625, 57.599609375, 59.4716796875, 61.34375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 10.0, 14.0, 20.0, 18.0, 27.0, 37.0, 56.0, 95.0, 112.0, 158.0, 150.0, 98.0, 56.0, 45.0, 26.0, 17.0, 16.0, 9.0, 11.0, 9.0, 3.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.024383544921875, -0.023798465728759766, -0.02321338653564453, -0.022628307342529297, -0.022043228149414062, -0.021458148956298828, -0.020873069763183594, -0.02028799057006836, -0.019702911376953125, -0.01911783218383789, -0.018532752990722656, -0.017947673797607422, -0.017362594604492188, -0.016777515411376953, -0.01619243621826172, -0.015607357025146484, -0.01502227783203125, -0.014437198638916016, -0.013852119445800781, -0.013267040252685547, -0.012681961059570312, -0.012096881866455078, -0.011511802673339844, -0.01092672348022461, -0.010341644287109375, -0.00975656509399414, -0.009171485900878906, -0.008586406707763672, -0.008001327514648438, -0.007416248321533203, -0.006831169128417969, -0.006246089935302734, -0.0056610107421875, -0.005075931549072266, -0.004490852355957031, -0.003905773162841797, -0.0033206939697265625, -0.002735614776611328, -0.0021505355834960938, -0.0015654563903808594, -0.000980377197265625, -0.0003952980041503906, 0.00018978118896484375, 0.0007748603820800781, 0.0013599395751953125, 0.0019450187683105469, 0.0025300979614257812, 0.0031151771545410156, 0.00370025634765625, 0.004285335540771484, 0.004870414733886719, 0.005455493927001953, 0.0060405731201171875, 0.006625652313232422, 0.007210731506347656, 0.007795810699462891, 0.008380889892578125, 0.00896596908569336, 0.009551048278808594, 0.010136127471923828, 0.010721206665039062, 0.011306285858154297, 0.011891365051269531, 0.012476444244384766, 0.0130615234375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 8.0, 9.0, 17.0, 25.0, 52.0, 78.0, 126.0, 281.0, 563.0, 1583.0, 5896.0, 51253.0, 903651.0, 74618.0, 7274.0, 1806.0, 659.0, 277.0, 162.0, 91.0, 38.0, 26.0, 27.0, 10.0, 1.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.3125, -71.880859375, -69.44921875, -67.017578125, -64.5859375, -62.154296875, -59.72265625, -57.291015625, -54.859375, -52.427734375, -49.99609375, -47.564453125, -45.1328125, -42.701171875, -40.26953125, -37.837890625, -35.40625, -32.974609375, -30.54296875, -28.111328125, -25.6796875, -23.248046875, -20.81640625, -18.384765625, -15.953125, -13.521484375, -11.08984375, -8.658203125, -6.2265625, -3.794921875, -1.36328125, 1.068359375, 3.5, 5.931640625, 8.36328125, 10.794921875, 13.2265625, 15.658203125, 18.08984375, 20.521484375, 22.953125, 25.384765625, 27.81640625, 30.248046875, 32.6796875, 35.111328125, 37.54296875, 39.974609375, 42.40625, 44.837890625, 47.26953125, 49.701171875, 52.1328125, 54.564453125, 56.99609375, 59.427734375, 61.859375, 64.291015625, 66.72265625, 69.154296875, 71.5859375, 74.017578125, 76.44921875, 78.880859375, 81.3125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 6.0, 11.0, 5.0, 27.0, 12.0, 15.0, 26.0, 34.0, 43.0, 55.0, 59.0, 101.0, 103.0, 103.0, 92.0, 63.0, 45.0, 45.0, 30.0, 32.0, 16.0, 20.0, 12.0, 13.0, 11.0, 6.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.46875, -47.15576171875, -45.8427734375, -44.52978515625, -43.216796875, -41.90380859375, -40.5908203125, -39.27783203125, -37.96484375, -36.65185546875, -35.3388671875, -34.02587890625, -32.712890625, -31.39990234375, -30.0869140625, -28.77392578125, -27.4609375, -26.14794921875, -24.8349609375, -23.52197265625, -22.208984375, -20.89599609375, -19.5830078125, -18.27001953125, -16.95703125, -15.64404296875, -14.3310546875, -13.01806640625, -11.705078125, -10.39208984375, -9.0791015625, -7.76611328125, -6.453125, -5.14013671875, -3.8271484375, -2.51416015625, -1.201171875, 0.11181640625, 1.4248046875, 2.73779296875, 4.05078125, 5.36376953125, 6.6767578125, 7.98974609375, 9.302734375, 10.61572265625, 11.9287109375, 13.24169921875, 14.5546875, 15.86767578125, 17.1806640625, 18.49365234375, 19.806640625, 21.11962890625, 22.4326171875, 23.74560546875, 25.05859375, 26.37158203125, 27.6845703125, 28.99755859375, 30.310546875, 31.62353515625, 32.9365234375, 34.24951171875, 35.5625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 6.0, 26.0, 66.0, 142.0, 400.0, 168.0, 93.0, 41.0, 18.0, 7.0, 10.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1384.5438232421875, -1334.343505859375, -1284.1431884765625, -1233.94287109375, -1183.7425537109375, -1133.542236328125, -1083.342041015625, -1033.1416015625, -982.9413452148438, -932.7410278320312, -882.5407104492188, -832.3404541015625, -782.14013671875, -731.9398193359375, -681.739501953125, -631.5391845703125, -581.3388671875, -531.1385498046875, -480.938232421875, -430.7379455566406, -380.5376281738281, -330.3373107910156, -280.13702392578125, -229.93670654296875, -179.73638916015625, -129.53607177734375, -79.33576965332031, -29.135467529296875, 21.064849853515625, 71.26516723632812, 121.4654541015625, 171.665771484375, 221.8660888671875, 272.06640625, 322.2667236328125, 372.4670104980469, 422.6673278808594, 472.8676452636719, 523.0679321289062, 573.2682495117188, 623.4685668945312, 673.6688842773438, 723.8692016601562, 774.0694580078125, 824.269775390625, 874.4700927734375, 924.67041015625, 974.8707275390625, 1025.071044921875, 1075.2713623046875, 1125.4716796875, 1175.6719970703125, 1225.872314453125, 1276.0726318359375, 1326.27294921875, 1376.47314453125, 1426.673583984375, 1476.8739013671875, 1527.07421875, 1577.2745361328125, 1627.474853515625, 1677.6751708984375, 1727.87548828125, 1778.07568359375, 1828.2760009765625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 7.0, 7.0, 14.0, 10.0, 14.0, 17.0, 17.0, 20.0, 35.0, 39.0, 27.0, 36.0, 56.0, 134.0, 135.0, 76.0, 36.0, 43.0, 53.0, 25.0, 38.0, 27.0, 23.0, 26.0, 12.0, 14.0, 10.0, 14.0, 9.0, 5.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1186.6971435546875, -1154.6898193359375, -1122.6824951171875, -1090.6751708984375, -1058.6678466796875, -1026.66064453125, -994.6532592773438, -962.6459350585938, -930.638671875, -898.63134765625, -866.6240234375, -834.61669921875, -802.6094360351562, -770.6021118164062, -738.5947875976562, -706.5874633789062, -674.5801391601562, -642.5728149414062, -610.5654907226562, -578.5582275390625, -546.5509033203125, -514.5435791015625, -482.5362548828125, -450.5289306640625, -418.5216369628906, -386.5143127441406, -354.50701904296875, -322.49969482421875, -290.49237060546875, -258.4850769042969, -226.47775268554688, -194.47044372558594, -162.46319580078125, -130.4558868408203, -98.44857025146484, -66.44125366210938, -34.43394470214844, -2.4266357421875, 29.5806884765625, 61.58799743652344, 93.59530639648438, 125.60261535644531, 157.60992431640625, 189.61724853515625, 221.6245574951172, 253.63186645507812, 285.6391906738281, 317.646484375, 349.65380859375, 381.6611328125, 413.6684265136719, 445.6757507324219, 477.68304443359375, 509.69036865234375, 541.6976928710938, 573.7050170898438, 605.7122802734375, 637.7196044921875, 669.7269287109375, 701.7342529296875, 733.7415161132812, 765.7488403320312, 797.7561645507812, 829.7634887695312, 861.7708129882812]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 29.0, 31.0, 58.0, 92.0, 153.0, 279.0, 480.0, 949.0, 1763.0, 4229.0, 11613.0, 46207.0, 396282.0, 2770284.0, 852849.0, 82150.0, 16750.0, 5482.0, 2319.0, 1068.0, 563.0, 295.0, 146.0, 94.0, 41.0, 36.0, 14.0, 14.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-214.875, -209.9521484375, -205.029296875, -200.1064453125, -195.18359375, -190.2607421875, -185.337890625, -180.4150390625, -175.4921875, -170.5693359375, -165.646484375, -160.7236328125, -155.80078125, -150.8779296875, -145.955078125, -141.0322265625, -136.109375, -131.1865234375, -126.263671875, -121.3408203125, -116.41796875, -111.4951171875, -106.572265625, -101.6494140625, -96.7265625, -91.8037109375, -86.880859375, -81.9580078125, -77.03515625, -72.1123046875, -67.189453125, -62.2666015625, -57.34375, -52.4208984375, -47.498046875, -42.5751953125, -37.65234375, -32.7294921875, -27.806640625, -22.8837890625, -17.9609375, -13.0380859375, -8.115234375, -3.1923828125, 1.73046875, 6.6533203125, 11.576171875, 16.4990234375, 21.421875, 26.3447265625, 31.267578125, 36.1904296875, 41.11328125, 46.0361328125, 50.958984375, 55.8818359375, 60.8046875, 65.7275390625, 70.650390625, 75.5732421875, 80.49609375, 85.4189453125, 90.341796875, 95.2646484375, 100.1875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 6.0, 7.0, 9.0, 18.0, 22.0, 25.0, 32.0, 26.0, 30.0, 46.0, 47.0, 29.0, 54.0, 70.0, 49.0, 62.0, 62.0, 64.0, 60.0, 54.0, 39.0, 35.0, 25.0, 38.0, 15.0, 15.0, 15.0, 11.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.4375, -67.1845703125, -64.931640625, -62.6787109375, -60.42578125, -58.1728515625, -55.919921875, -53.6669921875, -51.4140625, -49.1611328125, -46.908203125, -44.6552734375, -42.40234375, -40.1494140625, -37.896484375, -35.6435546875, -33.390625, -31.1376953125, -28.884765625, -26.6318359375, -24.37890625, -22.1259765625, -19.873046875, -17.6201171875, -15.3671875, -13.1142578125, -10.861328125, -8.6083984375, -6.35546875, -4.1025390625, -1.849609375, 0.4033203125, 2.65625, 4.9091796875, 7.162109375, 9.4150390625, 11.66796875, 13.9208984375, 16.173828125, 18.4267578125, 20.6796875, 22.9326171875, 25.185546875, 27.4384765625, 29.69140625, 31.9443359375, 34.197265625, 36.4501953125, 38.703125, 40.9560546875, 43.208984375, 45.4619140625, 47.71484375, 49.9677734375, 52.220703125, 54.4736328125, 56.7265625, 58.9794921875, 61.232421875, 63.4853515625, 65.73828125, 67.9912109375, 70.244140625, 72.4970703125, 74.75]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 6.0, 4.0, 10.0, 12.0, 23.0, 33.0, 62.0, 115.0, 216.0, 415.0, 981.0, 3277.0, 24562.0, 3492128.0, 655825.0, 12643.0, 2356.0, 782.0, 372.0, 188.0, 95.0, 58.0, 38.0, 28.0, 7.0, 15.0, 11.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-430.5, -418.15625, -405.8125, -393.46875, -381.125, -368.78125, -356.4375, -344.09375, -331.75, -319.40625, -307.0625, -294.71875, -282.375, -270.03125, -257.6875, -245.34375, -233.0, -220.65625, -208.3125, -195.96875, -183.625, -171.28125, -158.9375, -146.59375, -134.25, -121.90625, -109.5625, -97.21875, -84.875, -72.53125, -60.1875, -47.84375, -35.5, -23.15625, -10.8125, 1.53125, 13.875, 26.21875, 38.5625, 50.90625, 63.25, 75.59375, 87.9375, 100.28125, 112.625, 124.96875, 137.3125, 149.65625, 162.0, 174.34375, 186.6875, 199.03125, 211.375, 223.71875, 236.0625, 248.40625, 260.75, 273.09375, 285.4375, 297.78125, 310.125, 322.46875, 334.8125, 347.15625, 359.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 11.0, 20.0, 33.0, 52.0, 77.0, 112.0, 188.0, 311.0, 461.0, 722.0, 775.0, 487.0, 286.0, 181.0, 116.0, 78.0, 46.0, 33.0, 16.0, 15.0, 11.0, 4.0, 10.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-218.75, -210.68359375, -202.6171875, -194.55078125, -186.484375, -178.41796875, -170.3515625, -162.28515625, -154.21875, -146.15234375, -138.0859375, -130.01953125, -121.953125, -113.88671875, -105.8203125, -97.75390625, -89.6875, -81.62109375, -73.5546875, -65.48828125, -57.421875, -49.35546875, -41.2890625, -33.22265625, -25.15625, -17.08984375, -9.0234375, -0.95703125, 7.109375, 15.17578125, 23.2421875, 31.30859375, 39.375, 47.44140625, 55.5078125, 63.57421875, 71.640625, 79.70703125, 87.7734375, 95.83984375, 103.90625, 111.97265625, 120.0390625, 128.10546875, 136.171875, 144.23828125, 152.3046875, 160.37109375, 168.4375, 176.50390625, 184.5703125, 192.63671875, 200.703125, 208.76953125, 216.8359375, 224.90234375, 232.96875, 241.03515625, 249.1015625, 257.16796875, 265.234375, 273.30078125, 281.3671875, 289.43359375, 297.5]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 7.0, 13.0, 15.0, 23.0, 26.0, 54.0, 61.0, 107.0, 130.0, 161.0, 122.0, 84.0, 52.0, 35.0, 32.0, 21.0, 10.0, 14.0, 9.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1948.8421630859375, -1896.525390625, -1844.208740234375, -1791.8919677734375, -1739.5751953125, -1687.2584228515625, -1634.941650390625, -1582.625, -1530.3082275390625, -1477.991455078125, -1425.6748046875, -1373.3580322265625, -1321.041259765625, -1268.7244873046875, -1216.40771484375, -1164.091064453125, -1111.7742919921875, -1059.45751953125, -1007.1408081054688, -954.8240966796875, -902.50732421875, -850.1905517578125, -797.8738403320312, -745.55712890625, -693.2403564453125, -640.923583984375, -588.6068725585938, -536.2901611328125, -483.973388671875, -431.6566467285156, -379.33990478515625, -327.0231628417969, -274.7064208984375, -222.38967895507812, -170.07293701171875, -117.75619506835938, -65.439453125, -13.122711181640625, 39.19403076171875, 91.51077270507812, 143.8275146484375, 196.14425659179688, 248.46099853515625, 300.7777404785156, 353.094482421875, 405.4112243652344, 457.72796630859375, 510.0447082519531, 562.3614501953125, 614.67822265625, 666.9949340820312, 719.3116455078125, 771.62841796875, 823.9451904296875, 876.2619018554688, 928.57861328125, 980.8953857421875, 1033.212158203125, 1085.52880859375, 1137.8455810546875, 1190.162353515625, 1242.4791259765625, 1294.7958984375, 1347.112548828125, 1399.4293212890625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 10.0, 3.0, 9.0, 10.0, 9.0, 5.0, 20.0, 13.0, 17.0, 20.0, 24.0, 32.0, 28.0, 33.0, 29.0, 42.0, 37.0, 43.0, 45.0, 57.0, 51.0, 45.0, 63.0, 38.0, 34.0, 39.0, 34.0, 33.0, 21.0, 22.0, 17.0, 16.0, 22.0, 17.0, 19.0, 7.0, 7.0, 4.0, 14.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1089.88134765625, -1058.121337890625, -1026.361328125, -994.601318359375, -962.84130859375, -931.081298828125, -899.3212890625, -867.561279296875, -835.80126953125, -804.041259765625, -772.28125, -740.521240234375, -708.76123046875, -677.001220703125, -645.2412109375, -613.481201171875, -581.7211303710938, -549.9611206054688, -518.2011108398438, -486.44110107421875, -454.68109130859375, -422.92108154296875, -391.1610412597656, -359.4010314941406, -327.6410217285156, -295.8810119628906, -264.1210021972656, -232.36097717285156, -200.60096740722656, -168.84095764160156, -137.0809326171875, -105.3209228515625, -73.5609130859375, -41.800899505615234, -10.040885925292969, 21.719131469726562, 53.47914123535156, 85.23915100097656, 116.99917602539062, 148.75918579101562, 180.51919555664062, 212.27920532226562, 244.03921508789062, 275.79925537109375, 307.55926513671875, 339.31927490234375, 371.07928466796875, 402.83929443359375, 434.59930419921875, 466.35931396484375, 498.11932373046875, 529.8793334960938, 561.6393432617188, 593.3993530273438, 625.159423828125, 656.91943359375, 688.679443359375, 720.439453125, 752.199462890625, 783.95947265625, 815.719482421875, 847.4794921875, 879.239501953125, 910.99951171875, 942.759521484375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 9.0, 10.0, 16.0, 28.0, 41.0, 72.0, 108.0, 225.0, 381.0, 656.0, 1149.0, 2293.0, 4814.0, 11279.0, 30841.0, 113661.0, 633154.0, 180230.0, 42767.0, 14790.0, 6113.0, 2800.0, 1388.0, 735.0, 441.0, 221.0, 122.0, 85.0, 59.0, 28.0, 10.0, 12.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.1875, -89.4052734375, -85.623046875, -81.8408203125, -78.05859375, -74.2763671875, -70.494140625, -66.7119140625, -62.9296875, -59.1474609375, -55.365234375, -51.5830078125, -47.80078125, -44.0185546875, -40.236328125, -36.4541015625, -32.671875, -28.8896484375, -25.107421875, -21.3251953125, -17.54296875, -13.7607421875, -9.978515625, -6.1962890625, -2.4140625, 1.3681640625, 5.150390625, 8.9326171875, 12.71484375, 16.4970703125, 20.279296875, 24.0615234375, 27.84375, 31.6259765625, 35.408203125, 39.1904296875, 42.97265625, 46.7548828125, 50.537109375, 54.3193359375, 58.1015625, 61.8837890625, 65.666015625, 69.4482421875, 73.23046875, 77.0126953125, 80.794921875, 84.5771484375, 88.359375, 92.1416015625, 95.923828125, 99.7060546875, 103.48828125, 107.2705078125, 111.052734375, 114.8349609375, 118.6171875, 122.3994140625, 126.181640625, 129.9638671875, 133.74609375, 137.5283203125, 141.310546875, 145.0927734375, 148.875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 4.0, 6.0, 2.0, 8.0, 2.0, 9.0, 7.0, 11.0, 15.0, 18.0, 18.0, 11.0, 22.0, 21.0, 20.0, 17.0, 29.0, 32.0, 31.0, 26.0, 29.0, 42.0, 38.0, 35.0, 32.0, 40.0, 48.0, 46.0, 38.0, 34.0, 36.0, 28.0, 32.0, 26.0, 35.0, 28.0, 12.0, 19.0, 15.0, 11.0, 13.0, 5.0, 11.0, 7.0, 3.0, 6.0, 6.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0], "bins": [-60.96875, -59.1533203125, -57.337890625, -55.5224609375, -53.70703125, -51.8916015625, -50.076171875, -48.2607421875, -46.4453125, -44.6298828125, -42.814453125, -40.9990234375, -39.18359375, -37.3681640625, -35.552734375, -33.7373046875, -31.921875, -30.1064453125, -28.291015625, -26.4755859375, -24.66015625, -22.8447265625, -21.029296875, -19.2138671875, -17.3984375, -15.5830078125, -13.767578125, -11.9521484375, -10.13671875, -8.3212890625, -6.505859375, -4.6904296875, -2.875, -1.0595703125, 0.755859375, 2.5712890625, 4.38671875, 6.2021484375, 8.017578125, 9.8330078125, 11.6484375, 13.4638671875, 15.279296875, 17.0947265625, 18.91015625, 20.7255859375, 22.541015625, 24.3564453125, 26.171875, 27.9873046875, 29.802734375, 31.6181640625, 33.43359375, 35.2490234375, 37.064453125, 38.8798828125, 40.6953125, 42.5107421875, 44.326171875, 46.1416015625, 47.95703125, 49.7724609375, 51.587890625, 53.4033203125, 55.21875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 2.0, 5.0, 4.0, 13.0, 21.0, 14.0, 30.0, 30.0, 47.0, 67.0, 99.0, 122.0, 225.0, 319.0, 624.0, 1235.0, 3047.0, 10994.0, 71860.0, 895142.0, 50567.0, 8800.0, 2614.0, 1109.0, 512.0, 333.0, 203.0, 144.0, 105.0, 63.0, 53.0, 42.0, 27.0, 18.0, 13.0, 10.0, 7.0, 7.0, 3.0, 6.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-172.375, -167.05859375, -161.7421875, -156.42578125, -151.109375, -145.79296875, -140.4765625, -135.16015625, -129.84375, -124.52734375, -119.2109375, -113.89453125, -108.578125, -103.26171875, -97.9453125, -92.62890625, -87.3125, -81.99609375, -76.6796875, -71.36328125, -66.046875, -60.73046875, -55.4140625, -50.09765625, -44.78125, -39.46484375, -34.1484375, -28.83203125, -23.515625, -18.19921875, -12.8828125, -7.56640625, -2.25, 3.06640625, 8.3828125, 13.69921875, 19.015625, 24.33203125, 29.6484375, 34.96484375, 40.28125, 45.59765625, 50.9140625, 56.23046875, 61.546875, 66.86328125, 72.1796875, 77.49609375, 82.8125, 88.12890625, 93.4453125, 98.76171875, 104.078125, 109.39453125, 114.7109375, 120.02734375, 125.34375, 130.66015625, 135.9765625, 141.29296875, 146.609375, 151.92578125, 157.2421875, 162.55859375, 167.875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 9.0, 9.0, 9.0, 14.0, 13.0, 11.0, 15.0, 28.0, 21.0, 27.0, 24.0, 40.0, 48.0, 53.0, 48.0, 88.0, 77.0, 59.0, 67.0, 51.0, 41.0, 40.0, 27.0, 20.0, 27.0, 18.0, 12.0, 11.0, 14.0, 9.0, 14.0, 14.0, 3.0, 9.0, 6.0, 2.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-298.25, -289.296875, -280.34375, -271.390625, -262.4375, -253.484375, -244.53125, -235.578125, -226.625, -217.671875, -208.71875, -199.765625, -190.8125, -181.859375, -172.90625, -163.953125, -155.0, -146.046875, -137.09375, -128.140625, -119.1875, -110.234375, -101.28125, -92.328125, -83.375, -74.421875, -65.46875, -56.515625, -47.5625, -38.609375, -29.65625, -20.703125, -11.75, -2.796875, 6.15625, 15.109375, 24.0625, 33.015625, 41.96875, 50.921875, 59.875, 68.828125, 77.78125, 86.734375, 95.6875, 104.640625, 113.59375, 122.546875, 131.5, 140.453125, 149.40625, 158.359375, 167.3125, 176.265625, 185.21875, 194.171875, 203.125, 212.078125, 221.03125, 229.984375, 238.9375, 247.890625, 256.84375, 265.796875, 274.75]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 0.0, 5.0, 4.0, 7.0, 7.0, 12.0, 4.0, 6.0, 17.0, 12.0, 24.0, 34.0, 32.0, 80.0, 125.0, 140.0, 300.0, 625.0, 1619.0, 4105.0, 15492.0, 136556.0, 853782.0, 25724.0, 6122.0, 1989.0, 736.0, 396.0, 212.0, 124.0, 68.0, 49.0, 32.0, 27.0, 15.0, 15.0, 13.0, 12.0, 12.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-40.4375, -39.1396484375, -37.841796875, -36.5439453125, -35.24609375, -33.9482421875, -32.650390625, -31.3525390625, -30.0546875, -28.7568359375, -27.458984375, -26.1611328125, -24.86328125, -23.5654296875, -22.267578125, -20.9697265625, -19.671875, -18.3740234375, -17.076171875, -15.7783203125, -14.48046875, -13.1826171875, -11.884765625, -10.5869140625, -9.2890625, -7.9912109375, -6.693359375, -5.3955078125, -4.09765625, -2.7998046875, -1.501953125, -0.2041015625, 1.09375, 2.3916015625, 3.689453125, 4.9873046875, 6.28515625, 7.5830078125, 8.880859375, 10.1787109375, 11.4765625, 12.7744140625, 14.072265625, 15.3701171875, 16.66796875, 17.9658203125, 19.263671875, 20.5615234375, 21.859375, 23.1572265625, 24.455078125, 25.7529296875, 27.05078125, 28.3486328125, 29.646484375, 30.9443359375, 32.2421875, 33.5400390625, 34.837890625, 36.1357421875, 37.43359375, 38.7314453125, 40.029296875, 41.3271484375, 42.625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 8.0, 7.0, 12.0, 13.0, 13.0, 12.0, 29.0, 38.0, 70.0, 100.0, 148.0, 171.0, 140.0, 76.0, 43.0, 25.0, 15.0, 12.0, 10.0, 15.0, 6.0, 11.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01496124267578125, -0.014523625373840332, -0.014086008071899414, -0.013648390769958496, -0.013210773468017578, -0.01277315616607666, -0.012335538864135742, -0.011897921562194824, -0.011460304260253906, -0.011022686958312988, -0.01058506965637207, -0.010147452354431152, -0.009709835052490234, -0.009272217750549316, -0.008834600448608398, -0.00839698314666748, -0.007959365844726562, -0.0075217485427856445, -0.0070841312408447266, -0.006646513938903809, -0.006208896636962891, -0.005771279335021973, -0.005333662033081055, -0.004896044731140137, -0.004458427429199219, -0.004020810127258301, -0.003583192825317383, -0.003145575523376465, -0.002707958221435547, -0.002270340919494629, -0.001832723617553711, -0.001395106315612793, -0.000957489013671875, -0.000519871711730957, -8.225440979003906e-05, 0.0003553628921508789, 0.0007929801940917969, 0.0012305974960327148, 0.0016682147979736328, 0.0021058320999145508, 0.0025434494018554688, 0.0029810667037963867, 0.0034186840057373047, 0.0038563013076782227, 0.004293918609619141, 0.004731535911560059, 0.0051691532135009766, 0.0056067705154418945, 0.0060443878173828125, 0.0064820051193237305, 0.0069196224212646484, 0.007357239723205566, 0.007794857025146484, 0.008232474327087402, 0.00867009162902832, 0.009107708930969238, 0.009545326232910156, 0.009982943534851074, 0.010420560836791992, 0.01085817813873291, 0.011295795440673828, 0.011733412742614746, 0.012171030044555664, 0.012608647346496582, 0.0130462646484375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 7.0, 5.0, 13.0, 19.0, 31.0, 45.0, 68.0, 106.0, 165.0, 260.0, 508.0, 880.0, 1787.0, 3929.0, 10093.0, 37729.0, 848956.0, 113916.0, 18433.0, 6140.0, 2617.0, 1220.0, 650.0, 343.0, 215.0, 122.0, 88.0, 69.0, 39.0, 17.0, 17.0, 20.0, 6.0, 3.0, 3.0, 10.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.03125, -29.02197265625, -28.0126953125, -27.00341796875, -25.994140625, -24.98486328125, -23.9755859375, -22.96630859375, -21.95703125, -20.94775390625, -19.9384765625, -18.92919921875, -17.919921875, -16.91064453125, -15.9013671875, -14.89208984375, -13.8828125, -12.87353515625, -11.8642578125, -10.85498046875, -9.845703125, -8.83642578125, -7.8271484375, -6.81787109375, -5.80859375, -4.79931640625, -3.7900390625, -2.78076171875, -1.771484375, -0.76220703125, 0.2470703125, 1.25634765625, 2.265625, 3.27490234375, 4.2841796875, 5.29345703125, 6.302734375, 7.31201171875, 8.3212890625, 9.33056640625, 10.33984375, 11.34912109375, 12.3583984375, 13.36767578125, 14.376953125, 15.38623046875, 16.3955078125, 17.40478515625, 18.4140625, 19.42333984375, 20.4326171875, 21.44189453125, 22.451171875, 23.46044921875, 24.4697265625, 25.47900390625, 26.48828125, 27.49755859375, 28.5068359375, 29.51611328125, 30.525390625, 31.53466796875, 32.5439453125, 33.55322265625, 34.5625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 8.0, 4.0, 9.0, 5.0, 15.0, 9.0, 12.0, 12.0, 15.0, 22.0, 24.0, 31.0, 47.0, 77.0, 131.0, 121.0, 134.0, 96.0, 62.0, 36.0, 29.0, 15.0, 22.0, 13.0, 7.0, 4.0, 6.0, 7.0, 9.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-35.875, -34.869873046875, -33.86474609375, -32.859619140625, -31.8544921875, -30.849365234375, -29.84423828125, -28.839111328125, -27.833984375, -26.828857421875, -25.82373046875, -24.818603515625, -23.8134765625, -22.808349609375, -21.80322265625, -20.798095703125, -19.79296875, -18.787841796875, -17.78271484375, -16.777587890625, -15.7724609375, -14.767333984375, -13.76220703125, -12.757080078125, -11.751953125, -10.746826171875, -9.74169921875, -8.736572265625, -7.7314453125, -6.726318359375, -5.72119140625, -4.716064453125, -3.7109375, -2.705810546875, -1.70068359375, -0.695556640625, 0.3095703125, 1.314697265625, 2.31982421875, 3.324951171875, 4.330078125, 5.335205078125, 6.34033203125, 7.345458984375, 8.3505859375, 9.355712890625, 10.36083984375, 11.365966796875, 12.37109375, 13.376220703125, 14.38134765625, 15.386474609375, 16.3916015625, 17.396728515625, 18.40185546875, 19.406982421875, 20.412109375, 21.417236328125, 22.42236328125, 23.427490234375, 24.4326171875, 25.437744140625, 26.44287109375, 27.447998046875, 28.453125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 10.0, 26.0, 37.0, 105.0, 586.0, 142.0, 46.0, 27.0, 13.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2980.706298828125, -2919.3466796875, -2857.987060546875, -2796.62744140625, -2735.267822265625, -2673.908203125, -2612.548583984375, -2551.18896484375, -2489.829345703125, -2428.4697265625, -2367.110107421875, -2305.75048828125, -2244.390869140625, -2183.03125, -2121.671630859375, -2060.31201171875, -1998.952392578125, -1937.5927734375, -1876.233154296875, -1814.87353515625, -1753.513916015625, -1692.154296875, -1630.794677734375, -1569.43505859375, -1508.075439453125, -1446.7158203125, -1385.356201171875, -1323.99658203125, -1262.636962890625, -1201.27734375, -1139.917724609375, -1078.55810546875, -1017.1986083984375, -955.8389892578125, -894.4793701171875, -833.1197509765625, -771.7601318359375, -710.4005126953125, -649.0408935546875, -587.6812744140625, -526.3216552734375, -464.9620361328125, -403.6024169921875, -342.2427978515625, -280.8831787109375, -219.5235595703125, -158.1639404296875, -96.8043212890625, -35.4447021484375, 25.9149169921875, 87.2745361328125, 148.6341552734375, 209.9937744140625, 271.3533935546875, 332.7130126953125, 394.0726318359375, 455.4322509765625, 516.7918701171875, 578.1514892578125, 639.5111083984375, 700.8707275390625, 762.2303466796875, 823.5899658203125, 884.9495849609375, 946.3092041015625]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 9.0, 3.0, 8.0, 9.0, 5.0, 13.0, 12.0, 12.0, 18.0, 16.0, 29.0, 29.0, 28.0, 31.0, 32.0, 130.0, 297.0, 94.0, 27.0, 27.0, 27.0, 28.0, 20.0, 25.0, 13.0, 12.0, 11.0, 9.0, 11.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-863.6160888671875, -833.2435913085938, -802.87109375, -772.4986572265625, -742.1261596679688, -711.753662109375, -681.3811645507812, -651.0086669921875, -620.63623046875, -590.2637329101562, -559.8912353515625, -529.518798828125, -499.14630126953125, -468.7738037109375, -438.40130615234375, -408.0288391113281, -377.6563415527344, -347.2838439941406, -316.911376953125, -286.53887939453125, -256.1664123535156, -225.79391479492188, -195.4214324951172, -165.0489501953125, -134.6764678955078, -104.30398559570312, -73.93150329589844, -43.55901336669922, -13.186531066894531, 17.185958862304688, 47.558441162109375, 77.93092346191406, 108.30340576171875, 138.67588806152344, 169.04837036132812, 199.42086791992188, 229.7933349609375, 260.16583251953125, 290.538330078125, 320.9107971191406, 351.28326416015625, 381.65576171875, 412.0282287597656, 442.4007263183594, 472.773193359375, 503.14569091796875, 533.5181884765625, 563.890625, 594.26318359375, 624.6356811523438, 655.0081787109375, 685.380615234375, 715.7531127929688, 746.1256103515625, 776.4981079101562, 806.87060546875, 837.2430419921875, 867.6155395507812, 897.988037109375, 928.3604736328125, 958.7329711914062, 989.10546875, 1019.4779663085938, 1049.8504638671875, 1080.222900390625]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 4.0, 8.0, 8.0, 7.0, 4.0, 7.0, 12.0, 13.0, 7.0, 17.0, 22.0, 30.0, 14.0, 26.0, 18.0, 39.0, 52.0, 113.0, 216.0, 88.0, 44.0, 29.0, 38.0, 25.0, 22.0, 24.0, 19.0, 20.0, 10.0, 8.0, 11.0, 9.0, 5.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.5625, -58.560546875, -56.55859375, -54.556640625, -52.5546875, -50.552734375, -48.55078125, -46.548828125, -44.546875, -42.544921875, -40.54296875, -38.541015625, -36.5390625, -34.537109375, -32.53515625, -30.533203125, -28.53125, -26.529296875, -24.52734375, -22.525390625, -20.5234375, -18.521484375, -16.51953125, -14.517578125, -12.515625, -10.513671875, -8.51171875, -6.509765625, -4.5078125, -2.505859375, -0.50390625, 1.498046875, 3.5, 5.501953125, 7.50390625, 9.505859375, 11.5078125, 13.509765625, 15.51171875, 17.513671875, 19.515625, 21.517578125, 23.51953125, 25.521484375, 27.5234375, 29.525390625, 31.52734375, 33.529296875, 35.53125, 37.533203125, 39.53515625, 41.537109375, 43.5390625, 45.541015625, 47.54296875, 49.544921875, 51.546875, 53.548828125, 55.55078125, 57.552734375, 59.5546875, 61.556640625, 63.55859375, 65.560546875, 67.5625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 7.0, 3.0, 5.0, 4.0, 2.0, 7.0, 7.0, 13.0, 14.0, 28.0, 25.0, 38.0, 59.0, 89.0, 142.0, 233.0, 446.0, 1063.0, 2659.0, 9143.0, 8171796.0, 191191.0, 7378.0, 2284.0, 911.0, 400.0, 217.0, 118.0, 76.0, 58.0, 37.0, 22.0, 17.0, 21.0, 7.0, 12.0, 9.0, 12.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-526.0886840820312, -509.07855224609375, -492.06842041015625, -475.05828857421875, -458.0481262207031, -441.0379943847656, -424.0278625488281, -407.0177307128906, -390.007568359375, -372.9974365234375, -355.9873046875, -338.9771728515625, -321.9670104980469, -304.9568786621094, -287.9467468261719, -270.9366149902344, -253.92648315429688, -236.91635131835938, -219.9062042236328, -202.8960723876953, -185.88592529296875, -168.87579345703125, -151.86566162109375, -134.85552978515625, -117.84538269042969, -100.83524322509766, -83.82510375976562, -66.81497192382812, -49.804832458496094, -32.79469299316406, -15.784561157226562, 1.2255783081054688, 18.2357177734375, 35.24585723876953, 52.2559928894043, 69.26612854003906, 86.2762680053711, 103.28640747070312, 120.29653930664062, 137.30667114257812, 154.3168182373047, 171.3269500732422, 188.33709716796875, 205.34722900390625, 222.35736083984375, 239.3675079345703, 256.37762451171875, 273.3877868652344, 290.3979187011719, 307.4080505371094, 324.4181823730469, 341.4283447265625, 358.4384765625, 375.4486083984375, 392.458740234375, 409.4688720703125, 426.47900390625, 443.4891357421875, 460.499267578125, 477.5093994140625, 494.5195617675781, 511.5296936035156, 528.539794921875, 545.5499877929688, 562.5601196289062]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 2.0, 1.0, 5.0, 5.0, 3.0, 3.0, 5.0, 5.0, 6.0, 5.0, 6.0, 7.0, 3.0, 1.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-451.5982360839844, -436.83544921875, -422.07269287109375, -407.3099060058594, -392.5471496582031, -377.78436279296875, -363.0216064453125, -348.2588195800781, -333.4960632324219, -318.7332763671875, -303.97052001953125, -289.2077331542969, -274.4449768066406, -259.68218994140625, -244.91943359375, -230.15664672851562, -215.3938751220703, -200.631103515625, -185.8683319091797, -171.10556030273438, -156.34278869628906, -141.58001708984375, -126.8172378540039, -112.0544662475586, -97.29169464111328, -82.52892303466797, -67.76615142822266, -53.00337600708008, -38.240604400634766, -23.477828979492188, -8.715057373046875, 6.0477142333984375, 20.81048583984375, 35.57325744628906, 50.336029052734375, 65.09880065917969, 79.861572265625, 94.62435150146484, 109.38712310791016, 124.14989471435547, 138.91265869140625, 153.67543029785156, 168.43820190429688, 183.2009735107422, 197.9637451171875, 212.72653198242188, 227.48928833007812, 242.2520751953125, 257.01483154296875, 271.7776184082031, 286.5403747558594, 301.30316162109375, 316.06591796875, 330.8287048339844, 345.5914611816406, 360.354248046875, 375.1170349121094, 389.87982177734375, 404.642578125, 419.4053649902344, 434.1681213378906, 448.930908203125, 463.69366455078125, 478.4564514160156, 493.2192077636719]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 7.0, 6.0, 17.0, 23.0, 25.0, 43.0, 82.0, 167.0, 391.0, 1185.0, 5453.0, 57775.0, 396275.0, 55927.0, 5122.0, 1099.0, 345.0, 146.0, 73.0, 41.0, 20.0, 11.0, 6.0, 8.0, 6.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1380.0, -1334.75, -1289.5, -1244.25, -1199.0, -1153.75, -1108.5, -1063.25, -1018.0, -972.75, -927.5, -882.25, -837.0, -791.75, -746.5, -701.25, -656.0, -610.75, -565.5, -520.25, -475.0, -429.75, -384.5, -339.25, -294.0, -248.75, -203.5, -158.25, -113.0, -67.75, -22.5, 22.75, 68.0, 113.25, 158.5, 203.75, 249.0, 294.25, 339.5, 384.75, 430.0, 475.25, 520.5, 565.75, 611.0, 656.25, 701.5, 746.75, 792.0, 837.25, 882.5, 927.75, 973.0, 1018.25, 1063.5, 1108.75, 1154.0, 1199.25, 1244.5, 1289.75, 1335.0, 1380.25, 1425.5, 1470.75, 1516.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 5.0, 7.0, 9.0, 10.0, 11.0, 17.0, 30.0, 21.0, 19.0, 21.0, 30.0, 35.0, 33.0, 44.0, 47.0, 50.0, 60.0, 60.0, 40.0, 55.0, 42.0, 73.0, 39.0, 28.0, 29.0, 32.0, 28.0, 20.0, 8.0, 20.0, 13.0, 11.0, 6.0, 7.0, 5.0, 7.0, 5.0, 6.0, 0.0, 3.0, 2.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.21875, -57.13330078125, -55.0478515625, -52.96240234375, -50.876953125, -48.79150390625, -46.7060546875, -44.62060546875, -42.53515625, -40.44970703125, -38.3642578125, -36.27880859375, -34.193359375, -32.10791015625, -30.0224609375, -27.93701171875, -25.8515625, -23.76611328125, -21.6806640625, -19.59521484375, -17.509765625, -15.42431640625, -13.3388671875, -11.25341796875, -9.16796875, -7.08251953125, -4.9970703125, -2.91162109375, -0.826171875, 1.25927734375, 3.3447265625, 5.43017578125, 7.515625, 9.60107421875, 11.6865234375, 13.77197265625, 15.857421875, 17.94287109375, 20.0283203125, 22.11376953125, 24.19921875, 26.28466796875, 28.3701171875, 30.45556640625, 32.541015625, 34.62646484375, 36.7119140625, 38.79736328125, 40.8828125, 42.96826171875, 45.0537109375, 47.13916015625, 49.224609375, 51.31005859375, 53.3955078125, 55.48095703125, 57.56640625, 59.65185546875, 61.7373046875, 63.82275390625, 65.908203125, 67.99365234375, 70.0791015625, 72.16455078125, 74.25]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 10.0, 8.0, 12.0, 17.0, 35.0, 72.0, 114.0, 84.0, 56.0, 16.0, 13.0, 11.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-569.3441772460938, -548.782470703125, -528.220703125, -507.65899658203125, -487.0972595214844, -466.5355224609375, -445.97381591796875, -425.4120788574219, -404.850341796875, -384.2886047363281, -363.72686767578125, -343.1651611328125, -322.6034240722656, -302.04168701171875, -281.47998046875, -260.9182434082031, -240.35650634765625, -219.79476928710938, -199.23304748535156, -178.67132568359375, -158.10958862304688, -137.5478515625, -116.98612976074219, -96.42440795898438, -75.8626708984375, -55.300941467285156, -34.73921203613281, -14.177482604980469, 6.384246826171875, 26.94597625732422, 47.50770568847656, 68.06942749023438, 88.631103515625, 109.19283294677734, 129.7545623779297, 150.3162841796875, 170.87802124023438, 191.43975830078125, 212.00148010253906, 232.56320190429688, 253.12493896484375, 273.6866760253906, 294.2484130859375, 314.81011962890625, 335.3718566894531, 355.93359375, 376.49530029296875, 397.0570373535156, 417.6187744140625, 438.1805114746094, 458.74224853515625, 479.303955078125, 499.8656921386719, 520.4274291992188, 540.9891357421875, 561.5509033203125, 582.1126098632812, 602.67431640625, 623.236083984375, 643.7977905273438, 664.3594970703125, 684.9212646484375, 705.4829711914062, 726.044677734375, 746.6064453125]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 6.0, 7.0, 9.0, 20.0, 18.0, 49.0, 60.0, 75.0, 51.0, 43.0, 29.0, 19.0, 22.0, 7.0, 5.0, 3.0, 6.0, 6.0, 5.0, 8.0, 3.0, 3.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-343.83245849609375, -332.7225341796875, -321.6125793457031, -310.50262451171875, -299.3927001953125, -288.28277587890625, -277.1728210449219, -266.0628662109375, -254.95294189453125, -243.84300231933594, -232.73306274414062, -221.6231231689453, -210.51318359375, -199.4032440185547, -188.29330444335938, -177.18336486816406, -166.07342529296875, -154.96348571777344, -143.85354614257812, -132.7436065673828, -121.6336669921875, -110.52372741699219, -99.41378784179688, -88.30384826660156, -77.19390869140625, -66.08396911621094, -54.974029541015625, -43.86408996582031, -32.754150390625, -21.644210815429688, -10.534271240234375, 0.5756683349609375, 11.685577392578125, 22.795516967773438, 33.90545654296875, 45.01539611816406, 56.125335693359375, 67.23527526855469, 78.34521484375, 89.45515441894531, 100.56509399414062, 111.67503356933594, 122.78497314453125, 133.89491271972656, 145.00485229492188, 156.1147918701172, 167.2247314453125, 178.3346710205078, 189.44461059570312, 200.55455017089844, 211.66448974609375, 222.77442932128906, 233.88436889648438, 244.9943084716797, 256.104248046875, 267.21417236328125, 278.3241271972656, 289.43408203125, 300.54400634765625, 311.6539306640625, 322.7638854980469, 333.87384033203125, 344.9837646484375, 356.09368896484375, 367.2036437988281]}, "eval/loss": 6.748763084411621, "eval/wer": 1.2782506895251702, "eval/runtime": 1382.3061, "eval/samples_per_second": 1.911, "eval/steps_per_second": 0.478} \ No newline at end of file